diff --git a/.gitattributes b/.gitattributes
index 8794fdc0a5c..45b42096b9d 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -7,3 +7,19 @@
 /demos/build_demos_msvc.bat omz.package=w
 /demos/tests/** -omz.package
 /tools/downloader/tests/** -omz.package
+
+/ci/requirements-ac.txt omz.ci.job-for-change.ac
+/ci/requirements-ac-test.txt omz.ci.job-for-change.ac
+/ci/requirements-conversion.txt omz.ci.job-for-change.demos omz.ci.job-for-change.models
+/ci/requirements-demos.txt omz.ci.job-for-change.demos
+/ci/requirements-downloader.txt omz.ci.job-for-change.demos omz.ci.job-for-change.models
+
+/demos/** omz.ci.job-for-change.demos
+/demos/**/*.md -omz.ci.job-for-change.demos
+
+/models/** omz.ci.job-for-change.documentation
+/models/**/*.yml -omz.ci.job-for-change.documentation
+
+/tools/accuracy_checker/** omz.ci.job-for-change.ac
+/tools/downloader/** omz.ci.job-for-change.downloader
+/tools/**/*.md -omz.ci.job-for-change.ac -omz.ci.job-for-change.downloader
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
new file mode 100644
index 00000000000..ec208adb8b6
--- /dev/null
+++ b/CONTRIBUTING.md
@@ -0,0 +1,276 @@
+# How to Contribute Models to Open Model Zoo
+
+We appreciate your intention to contribute a model to the OpenVINO&trade; Open Model Zoo (OMZ). OMZ is licensed under the Apache\* License, Version 2.0. By contributing to the project, you agree to the license and copyright terms therein and release your contribution under these terms. Note that we accept models under permissive licenses, such as **MIT**, **Apache 2.0**, and **BSD-3-Clause**. Otherwise, it might take longer to get your model approved.
+
+Frameworks supported by the Open Model Zoo: 
+* Caffe\*
+* Caffe2\* (via conversion to ONNX\*)
+* TensorFlow\*
+* PyTorch\* (via conversion to ONNX\*)
+* MXNet\*
+
+Open Model Zoo also supports models already in the ONNX format.
+
+## Pull Request Requirements
+
+To contribute to OMZ, create a pull request (PR) in this repository using the `develop` branch.
+Pull requests are strictly formalized and are reviewed by the OMZ maintainers for consistency and legal compliance.
+
+Each PR contributing a model must contain:
+* [configuration file `model.yml`](#configuration-file)
+* [documentation of model in markdown format](#documentation)
+* [accuracy validation configuration file](#accuracy-validation)
+* (*optional*) [demo](#demo)
+
+Follow the rules in the sections below before submitting a pull request.
+
+### Model Name
+
+Name your model in OMZ according to the following rules:
+- Use a name that is consistent with the original name; an exact match is not necessary
+- Use lowercase
+- Use `-` (preferable) or `_` as delimiters; spaces are not allowed
+- Add a suffix according to framework identifier (see **`framework`** description in the [configuration file](#configuration-file) section for examples), if the model is a reimplementation of an existing model from another framework
+
+This name will be used for downloading, converting, and other operations.
+Examples of model names:
+- `resnet-50-pytorch`
+- `mobilenet-v2-1.0-224`
+
+### Files Location
+
+Place your files as shown in the table below:
+
+File | Destination
+---|---
+configuration file | `models/public/<model_name>/model.yml`
+documentation file | `models/public/<model_name>/<model_name>.md`
+validation configuration file|`tools/accuracy_checker/configs/<model_name>.yml`
+demo|`demos/<demo_name>`<br>or<br>`demos/python_demos/<demo_name>`
+
+### Tests
+
+Your PR must pass the following tests:
+* Model is downloadable by the `tools/downloader/downloader.py` script. See [Configuration file](#configuration-file) for details.
+* Model is convertible by the `tools/downloader/converter.py` script. See [Model conversion](#model-conversion) for details.
+* Model is usable by demo or sample and provides adequate results. See [Demo](#demo) for details.
+* Model passes accuracy validation. See [Accuracy validation](#accuracy-validation) for details.
+
+
+### PR Rejection
+
+Your PR may be rejected in some cases, for example:
+* If a license is inappropriate (such as GPL-like licenses).
+* If a dataset is inaccessible.
+* If the PR fails one of the tests above.
+
+## Configuration File
+
+The model configuration file contains information about the model: what it is, how to download it, and how to convert it to the IR format. This information must be specified in the `model.yml` file that must be located in the model subfolder.
+
+The detailed descriptions of the file entries are provided below.
+
+**`description`**
+
+Description of the model. Must match with the description from the model [documentation](#documentation).
+
+**`task_type`**
+
+[Model task type](tools/downloader/README.md#model-information-dumper-usage). If none of the existing task types fits your model, add a new one to the list `KNOWN_TASK_TYPES` of the [tools/downloader/common.py](tools/downloader/common.py) file.
+
+**`files`**
+
+> **NOTE**: Before filling this section, make sure that the model can be downloaded either via a direct HTTP(S) link or from Google Drive\*.
+
+Downloadable files. Each file is described by:
+
+* `name` - sets a file name after downloading
+* `size` - sets a file size
+* `sha256`  - sets a file hash sum
+* `source` - sets a direct link to a file *OR* describes file access parameters
+
+> **TIP**: You can obtain a hash sum using the `sha256sum <file_name>` command on Linux\*.
+ 
+If the file is located on Google Drive\*, the `source` section must contain:
+- `$type: google_drive`
+- `id` - file ID on Google Drive\*
+
+> **NOTE:** If the file is on GitHub\*, use a link to a specific version of the file.
+
+**`postprocessing`** (*optional*)
+
+Post processing of the downloaded files.
+
+For unpacking archive:
+- `$type: unpack_archive`
+- `file` — Archive file name
+- `format` — Archive format (zip | tar | gztar | bztar | xztar)
+
+For replacement operation:
+- `$type: regex_replace`
+- `file` — Name of file to run replacement in
+- `pattern` — [Regular expression](https://docs.python.org/3/library/re.html)
+- `replacement` — Replacement string
+- `count` (*optional*)  — Exact number of replacements (if the number of `pattern` occurrences is less than this number, downloading will be aborted)
+
+**`conversion_to_onnx_args`** (*only for Caffe2\*, PyTorch\* models*)
+
+List of ONNX\* conversion parameters, see `model_optimizer_args` for details.
+
+**`model_optimizer_args`**
+
+Conversion parameters (learn more in the [Model conversion](#model-conversion) section). For example:
+```
+  - --input=data
+  - --mean_values=data[127.5]
+  - --scale_values=data[127.5]
+  - --reverse_input_channels
+  - --output=prob
+  - --input_model=$conv_dir/googlenet-v3.onnx
+```
+
+> **NOTE:** Do not specify `framework`, `data_type`, `model_name` and `output_dir`, since they are deduced automatically.
+
+> **NOTE:** `$dl_dir` is substituted with the subdirectory of the downloaded model and `$conv_dir` is substituted with the subdirectory of the converted model.
+
+**`framework`**
+
+Framework of the original model (see [here](tools/downloader/README.md#model-information-dumper-usage) for details).
+
+**`license`**
+
+URL of the model license.
+
+### Example
+
+This example shows how to download the classification model [DenseNet-121*](models/public/densenet-121-tf/model.yml) pretrained in TensorFlow\* from Google Drive\* as an archive.
+
+```
+description: >-
+  This is a TensorFlow\* version of `densenet-121` model, one of the DenseNet
+  group of models designed to perform image classification. The weights were converted
+  from DenseNet-Keras Models. For details see repository <https://github.com/pudae/tensorflow-densenet/>,
+  paper <https://arxiv.org/pdf/1608.06993.pdf>
+task_type: classification
+files:
+  - name: tf-densenet121.tar.gz
+    size: 30597420
+    sha256: b31ec840358f1d20e1c6364d05ce463cb0bc0480042e663ad54547189501852d
+    source:
+      $type: google_drive
+      id: 0B_fUSpodN0t0eW1sVk1aeWREaDA
+postprocessing:
+  - $type: unpack_archive
+    format: gztar
+    file: tf-densenet121.tar.gz
+model_optimizer_args:
+  - --reverse_input_channels
+  - --input_shape=[1,224,224,3]
+  - --input=Placeholder
+  - --mean_values=Placeholder[123.68,116.78,103.94]
+  - --scale_values=Placeholder[58.8235294117647]
+  - --output=densenet121/predictions/Reshape_1
+  - --input_meta_graph=$dl_dir/tf-densenet121.ckpt.meta
+framework: tf
+license: https://raw.githubusercontent.com/pudae/tensorflow-densenet/master/LICENSE
+```
+
+## Model Conversion
+
+Deep Learning Inference Engine (IE) supports models in the Intermediate Representation (IR) format. A model from any supported framework can be converted to IR using the Model Optimizer tool included in the OpenVINO&trade; toolkit. Find more information about conversion in the [Model Optimizer Developer Guide](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html). After a successful conversion you get a model in the IR format, with the `*.xml` file representing the net graph and the `*.bin` file containing the net parameters. 
+
+> **NOTE 1**: Image preprocessing parameters (mean and scale) must be built into a converted model to simplify model usage.
+
+> **NOTE 2**: If a model input is a color image, color channel order should be `BGR`.
+
+## Demo
+
+A demo shows the main idea of how to infer a model using IE. If your model solves one of the tasks supported by the Open Model Zoo, try to find an appropriate option from [demos](demos/README.md) or [samples](https://docs.openvinotoolkit.org/latest/_docs_IE_DG_Samples_Overview.html). Otherwise, you must provide your own demo (C++ or Python). 
+
+The demo's name should end with `_demo` suffix to follow the convention of the project.
+
+Demos are required to support the following keys:
+
+ -  `-i "<input>"`: Required. Input to process.
+ -  `-m "<path>"`: Required. Path to an .xml file with a trained model. If the demo uses several models at the same time, use other keys prefixed with `-m_`.
+ -  `-d "<device>"`: Optional. Specifies a target device to infer on. CPU, GPU, FPGA, HDDL or MYRIAD is acceptable. Default must be CPU. If the demo uses several models at the same time, use keys prefixed with `-d_` (just like keys `-m_*` above) to specify device for each model.
+ -  `-no_show`: Optional. Do not visualize inference results.
+
+> **TIP**: For Python, it is preferable to use `--` instead of `-` for long keys.
+
+You can also add any other necessary parameters.
+
+Add a `README.md` file that describes the demo usage. Update [demos' README.md](demos/README.md) by adding your demo to the list.
+
+## Accuracy Validation
+
+Accuracy validation can be performed by the [Accuracy Checker](./tools/accuracy_checker) tool. This tool can use either IE to run a converted model, or an original framework to run an original model. Accuracy Checker supports lots of datasets, metrics and preprocessing options, which simplifies validation if a task is supported by the tool. You only need to create a configuration file that contains necessary parameters for accuracy validation (specify a dataset and annotation, pre- and post-processing parameters, accuracy metrics to compute and so on) of converted model. For details, refer to [Testing new models](./tools/accuracy_checker#testing-new-models).
+
+If a model uses a dataset which is not supported by the Accuracy Checker, you also must provide the license and the link to it and mention it in the PR description. 
+
+When the configuration file is ready, you must run the Accuracy Checker to obtain metric results. If they match your results, that means conversion was successful and the Accuracy Checker fully supports your model, metric and dataset. Otherwise, recheck the [conversion](#model-conversion) parameters or the validation configuration file.
+
+### Example
+
+This example uses one of the files from `tools/accuracy_checker/configs` — validation configuration file for [DenseNet-121](tools/accuracy_checker/configs/densenet-121-tf.yml)\* from TensorFlow\*:
+```
+models:
+  - name: densenet-121-tf
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/densenet-121-tf/FP32/densenet-121-tf.xml
+        weights: public/densenet-121-tf/FP32/densenet-121-tf.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/densenet-121-tf/FP16/densenet-121-tf.xml
+        weights: public/densenet-121-tf/FP16/densenet-121-tf.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: resize
+            size: 256
+          - type: crop
+            size: 224
+```
+
+
+## Documentation
+
+Documentation is a very important part of model contribution as it helps to better understand the possible usage of the model. Documentation must be named in accordance with the name of the model.
+The documentation should contain:
+* description of a model
+	* main purpose
+	* features
+	* references to a paper or/and a source
+* model specification
+	* type
+	* framework
+	* GFLOPs (*if available*)
+	* number of parameters (*if available*)
+* validation dataset description and/or a link
+* main accuracy values (also description of a metric)
+* detailed description of input and output for original and converted models
+* the model's licensing terms
+
+Learn the detailed structure and headers naming convention from any model documentation (for example, [alexnet](./models/public/alexnet/alexnet.md)).
+
+## Legal Information
+
+[\*] Other names and brands may be claimed as the property of others.
+
+OpenVINO is a trademark of Intel Corporation or its subsidiaries in the U.S. and/or other countries.
+
+Copyright &copy; 2018-2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at
+```
+http://www.apache.org/licenses/LICENSE-2.0
+```
+Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License.
diff --git a/README.md b/README.md
index 1cd0e48b614..cfd71e8c23a 100644
--- a/README.md
+++ b/README.md
@@ -1,6 +1,5 @@
 # [OpenVINO™ Toolkit](https://01.org/openvinotoolkit) - Open Model Zoo repository
-[![Build Status](http://134.191.240.124/buildStatus/icon?job=omz/2018/trigger)](http://134.191.240.124/job/omz/job/2018/job/trigger/)
-[![Stable release](https://img.shields.io/badge/version-2019_R3.1-green.svg)](https://github.com/opencv/open_model_zoo/releases/tag/2019_R3.1)
+[![Stable release](https://img.shields.io/badge/version-2020.2-green.svg)](https://github.com/opencv/open_model_zoo/releases/tag/2020.2)
 [![Gitter chat](https://badges.gitter.im/gitterHQ/gitter.png)](https://gitter.im/open_model_zoo/community)
 [![Apache License Version 2.0](https://img.shields.io/badge/license-Apache_2.0-green.svg)](LICENSE)
 
@@ -34,6 +33,8 @@ We welcome community contributions to the Open Model Zoo repository. If you have
 * In case of a larger feature, provide a relevant demo.
 * Submit a pull request at https://github.com/opencv/open_model_zoo/pulls
 
+You can find additional information about model contribution [here](CONTRIBUTING.md).
+
 We will review your contribution and, if any additional fixes or modifications are needed, may give you feedback to guide you. When accepted, your pull request will be merged into the GitHub* repositories.
 
 Open Model Zoo is licensed under Apache License, Version 2.0. By contributing to the project, you agree to the license and copyright terms therein and release your contribution under these terms.
diff --git a/ci/get-jobs-for-changes.py b/ci/get-jobs-for-changes.py
new file mode 100755
index 00000000000..829a4f8f0a6
--- /dev/null
+++ b/ci/get-jobs-for-changes.py
@@ -0,0 +1,72 @@
+#!/usr/bin/python3
+
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""
+A script that prints a JSON description of the CI jobs necessary to validate
+the changes made between a base commit and the current commit.
+
+The output format is an object where each key is the identifier of the job
+and the corresponding value represents that job's parameters. The value
+is usually just "true" (which just means that the job should be run), but
+for the "models" job the value can be an array of names of models that should
+be validated.
+"""
+
+import argparse
+import json
+import re
+import subprocess
+import sys
+
+from pathlib import Path, PurePosixPath
+
+RE_ATTRIB_NAME = re.compile(r"omz\.ci\.job-for-change\.(.+)")
+
+def group_by_n(iterable, n):  # split a flat sequence into consecutive n-tuples
+    return zip(*[iter(iterable)] * n)  # one shared iterator repeated n times; a trailing partial group is dropped
+
+def main():  # print a JSON object mapping CI job names to their parameters
+    parser = argparse.ArgumentParser()
+    parser.add_argument('base_commit', metavar='COMMIT')
+    args = parser.parse_args()
+
+    git_diff_output = subprocess.check_output(  # NUL-terminated names of the files that differ (-z)
+        ["git", "diff", "--name-only", "-z", args.base_commit + "...HEAD"])
+    changed_files = list(map(PurePosixPath, git_diff_output.decode()[:-1].split("\0")))  # [:-1] drops the final NUL
+
+    models_dir = PurePosixPath("models")
+
+    jobs = {}
+
+    for changed_file in changed_files:
+        if models_dir in changed_file.parents and changed_file.name == "model.yml":  # any model.yml under models/
+            if Path(changed_file).exists(): # it might've been deleted in the branch
+                jobs.setdefault("models", []).append(changed_file.parent.name)  # the containing directory's name identifies the model
+
+    git_check_attr_output = subprocess.run(  # look up every attribute of each changed path
+        ["git", "check-attr", "--stdin", "-z", "--all"],
+        input=git_diff_output, stdout=subprocess.PIPE, check=True).stdout
+
+    for path, attribute, value in group_by_n(git_check_attr_output.decode()[:-1].split("\0"), 3):  # flat NUL-separated (path, attribute, value) records
+        attribute_match = RE_ATTRIB_NAME.fullmatch(attribute)
+        if value != 'unset' and attribute_match:  # 'unset' is what git reports for an attribute negated with "-attr"
+            jobs[attribute_match.group(1)] = True  # replaces any list already stored under the same job name
+
+    json.dump(jobs, sys.stdout)
+    print()  # end the output with a newline
+
+if __name__ == "__main__":
+    main()
diff --git a/ci/requirements-ac-test.txt b/ci/requirements-ac-test.txt
new file mode 100644
index 00000000000..3a066c4525d
--- /dev/null
+++ b/ci/requirements-ac-test.txt
@@ -0,0 +1,31 @@
+#
+# This file is autogenerated by pip-compile
+# To update, run:
+#
+#    pip-compile --output-file=ci/requirements-ac-test.txt tools/accuracy_checker/requirements-test.in tools/accuracy_checker/requirements.in
+#
+attrs==19.3.0             # via pytest
+importlib-metadata==1.5.0  # via pluggy, pytest
+joblib==0.14.1            # via scikit-learn
+more-itertools==8.2.0     # via pytest
+nibabel==3.0.1
+numpy==1.17.5
+packaging==20.1           # via pytest
+pathlib2==2.3.5           # via pytest
+pillow==7.0.0
+pluggy==0.13.1            # via pytest
+py-cpuinfo==4.0.0
+py==1.8.1                 # via pytest
+pyparsing==2.4.6          # via packaging
+pytest-mock==2.0.0
+pytest==5.3.5
+pyyaml==5.3
+scikit-learn==0.22.1
+scipy==1.4.1
+sentencepiece==0.1.85
+shapely==1.7.0
+six==1.14.0               # via packaging, pathlib2
+tqdm==4.42.1
+wcwidth==0.1.8            # via pytest
+yamlloader==0.5.5
+zipp==1.1.0               # via importlib-metadata
diff --git a/ci/requirements-ac.txt b/ci/requirements-ac.txt
index 342f042f103..8fdbf925883 100644
--- a/ci/requirements-ac.txt
+++ b/ci/requirements-ac.txt
@@ -1,12 +1,18 @@
-joblib==0.13.2            # via scikit-learn
-nibabel==2.5.0
-numpy==1.17.0
-pillow==6.1.0
+#
+# This file is autogenerated by pip-compile
+# To update, run:
+#
+#    pip-compile --output-file=ci/requirements-ac.txt tools/accuracy_checker/requirements.in
+#
+joblib==0.14.1            # via scikit-learn
+nibabel==3.0.1
+numpy==1.17.5
+pillow==7.0.0
 py-cpuinfo==4.0.0
-pyyaml==5.1.2
-scikit-learn==0.21.3
-scipy==0.19.0
-shapely==1.6.4.post2
-six==1.12.0               # via nibabel
-tqdm==4.33.0
+pyyaml==5.3
+scikit-learn==0.22.1
+scipy==1.4.1
+sentencepiece==0.1.85
+shapely==1.7.0
+tqdm==4.42.1
 yamlloader==0.5.5
diff --git a/ci/requirements-conversion.txt b/ci/requirements-conversion.txt
index d147fcefea7..d94e3079b24 100644
--- a/ci/requirements-conversion.txt
+++ b/ci/requirements-conversion.txt
@@ -1,40 +1,40 @@
-absl-py==0.7.1            # via tensorboard, tensorflow
-astor==0.8.0              # via tensorflow
-certifi==2019.6.16        # via requests
+absl-py==0.9.0            # via tensorboard, tensorflow
+astor==0.8.1              # via tensorflow
+certifi==2019.11.28       # via requests
 chardet==3.0.4            # via requests
-decorator==4.4.0          # via networkx
+decorator==4.4.1          # via networkx
 defusedxml==0.6.0
+future==0.18.2
 gast==0.2.2               # via tensorflow
-google-pasta==0.1.7       # via tensorflow
+google-pasta==0.1.8       # via tensorflow
 graphviz==0.8.4           # via mxnet
-grpcio==1.22.0            # via tensorboard, tensorflow
-h5py==2.9.0               # via keras-applications
+grpcio==1.26.0            # via tensorboard, tensorflow
+h5py==2.10.0              # via keras-applications
 idna==2.8                 # via requests
 keras-applications==1.0.8  # via tensorflow
 keras-preprocessing==1.1.0  # via tensorflow
 markdown==3.1.1           # via tensorboard
-mxnet==1.3.1
-networkx==2.3
-numpy==1.14.6
-onnx==1.5.0
-pillow==6.1.0             # via torchvision
+mxnet==1.5.1
+networkx==2.4
+numpy==1.18.1
+onnx==1.6.0
+opt-einsum==3.1.0         # via tensorflow
+pillow==7.0.0             # via torchvision
 protobuf==3.6.1
 requests==2.22.0          # via mxnet
-scipy==1.3.1
-six==1.12.0               # via absl-py, grpcio, h5py, keras-preprocessing, onnx, protobuf, tensorboard, tensorflow, test-generator, torchvision
-tensorboard==1.14.0       # via tensorflow
-tensorflow-estimator==1.14.0  # via tensorflow
-tensorflow==1.14.0
+scipy==1.4.1
+six==1.14.0               # via absl-py, google-pasta, grpcio, h5py, keras-preprocessing, onnx, protobuf, tensorboard, tensorflow, torchvision
+tensorboard==1.15.0       # via tensorflow
+tensorflow-estimator==1.15.1  # via tensorflow
+tensorflow==1.15.2
 termcolor==1.1.0          # via tensorflow
-test-generator==0.1.1
-torch==1.2.0
-torchvision==0.4.0
-typing-extensions==3.7.4  # via onnx
-typing==3.7.4             # via onnx
-urllib3==1.25.3           # via requests
-werkzeug==0.15.5          # via tensorboard
-wheel==0.33.4             # via tensorboard, tensorflow
+torch==1.4.0
+torchvision==0.5.0
+typing-extensions==3.7.4.1  # via onnx
+urllib3==1.25.8           # via requests
+werkzeug==0.16.1          # via tensorboard
+wheel==0.34.1             # via tensorboard, tensorflow
 wrapt==1.11.2             # via tensorflow
 
 # The following packages are considered to be unsafe in a requirements file:
-# setuptools==41.0.1        # via markdown, protobuf, tensorboard
+# setuptools
diff --git a/ci/requirements-demos.txt b/ci/requirements-demos.txt
index e07312c7697..b76e094ee0f 100644
--- a/ci/requirements-demos.txt
+++ b/ci/requirements-demos.txt
@@ -1 +1,6 @@
-numpy==1.17.0 ; python_version >= "3.4"
+joblib==0.14.1            # via scikit-learn
+nibabel==3.0.1
+numpy==1.18.1 ; python_version >= "3.4"
+scikit-learn==0.22.1
+scipy==1.4.1
+tqdm==4.42.0
diff --git a/ci/requirements-downloader.txt b/ci/requirements-downloader.txt
index 3f154ea4cb8..71005e1a89a 100644
--- a/ci/requirements-downloader.txt
+++ b/ci/requirements-downloader.txt
@@ -4,9 +4,9 @@
 #
 #    pip-compile --output-file=ci/requirements-downloader.txt tools/downloader/requirements.in
 #
-certifi==2019.6.16        # via requests
+certifi==2019.11.28       # via requests
 chardet==3.0.4            # via requests
 idna==2.8                 # via requests
-pyyaml==5.1.2
+pyyaml==5.3
 requests==2.22.0
-urllib3==1.25.3           # via requests
+urllib3==1.25.8           # via requests
diff --git a/ci/update-requirements.py b/ci/update-requirements.py
new file mode 100755
index 00000000000..4009758b4d0
--- /dev/null
+++ b/ci/update-requirements.py
@@ -0,0 +1,58 @@
+#!/usr/bin/env python3
+
+"""
+This script updates all of the requirements-*.txt files in this directory
+with the most recent package versions.
+
+It uses pip-compile (https://github.com/jazzband/pip-tools), so install that
+before running it.
+"""
+
+import os
+import subprocess
+import sys
+
+from pathlib import Path
+
+# Package dependencies can vary depending on the Python version.
+# We thus have to run pip-compile with the lowest Python version that
+# the project supports.
+EXPECTED_PYTHON_VERSION = (3, 5)
+
+repo_root = Path(__file__).resolve().parent.parent
+
+def pip_compile(target, *sources):  # regenerate the pinned requirements file `target` from the `sources` input files
+    print('updating {}...'.format(target), flush=True)
+
+    # Use --no-header, since the OpenVINO install path may vary between machines,
+    # so it should not be embedded in the output file. Also, this script makes
+    # the information in pip-compile's headers redundant.
+
+    subprocess.run(
+        [sys.executable, '-mpiptools', 'compile',  # run pip-tools with the interpreter running this script
+            '--no-header', '--upgrade', '--quiet', '-o', target, '--', *map(str, sources)],
+        check=True, cwd=str(repo_root))  # relative paths are resolved against the repository root
+
+def main():  # check the environment, then regenerate the five ci/requirements-*.txt files
+    if sys.version_info[:2] != EXPECTED_PYTHON_VERSION:  # only the (major, minor) pair is compared
+        sys.exit("run this with Python {}".format('.'.join(map(str, EXPECTED_PYTHON_VERSION))))
+
+    if 'INTEL_OPENVINO_DIR' not in os.environ:
+        sys.exit("run OpenVINO toolkit's setupvars.sh before this")
+
+    openvino_dir = Path(os.environ['INTEL_OPENVINO_DIR'])  # some input files live inside the OpenVINO installation
+
+    pip_compile('ci/requirements-ac.txt',
+        'tools/accuracy_checker/requirements.in')
+    pip_compile('ci/requirements-ac-test.txt',
+        'tools/accuracy_checker/requirements.in', 'tools/accuracy_checker/requirements-test.in')
+    pip_compile('ci/requirements-conversion.txt',
+        'tools/downloader/requirements-pytorch.in', 'tools/downloader/requirements-caffe2.in',
+        openvino_dir / 'deployment_tools/model_optimizer/requirements.txt')
+    pip_compile('ci/requirements-demos.txt',
+        'demos/python_demos/requirements.txt', openvino_dir / 'python/requirements.txt')
+    pip_compile('ci/requirements-downloader.txt',
+        'tools/downloader/requirements.in')
+
+if __name__ == '__main__':
+    main()
diff --git a/demos/CMakeLists.txt b/demos/CMakeLists.txt
index ca6633fb808..376cf916d48 100644
--- a/demos/CMakeLists.txt
+++ b/demos/CMakeLists.txt
@@ -6,6 +6,8 @@ cmake_minimum_required (VERSION 2.8.12)
 
 project(Demos)
 
+option(ENABLE_PYTHON "Whether to build extension modules for Python demos" OFF)
+
 if (CMAKE_BUILD_TYPE STREQUAL "")
     message(STATUS "CMAKE_BUILD_TYPE not defined, 'Release' will be used")
     set(CMAKE_BUILD_TYPE "Release")
@@ -97,7 +99,7 @@ if (${CMAKE_CXX_COMPILER_ID} STREQUAL GNU)
     set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wall")
 endif()
 
-add_subdirectory(common/format_reader)
+add_subdirectory(common)
 
 # samples build can be switched off during whole IE build
 if (IE_MAIN_SOURCE_DIR AND NOT ENABLE_SAMPLES)
@@ -155,10 +157,6 @@ macro(ie_add_sample)
         endif()
     endif()
 
-    if(TARGET IE::ie_cpu_extension)
-        add_definitions(-DWITH_EXTENSIONS)
-    endif()
-
     # Create named folders for the sources within the .vcproj
     # Empty name lists them directly under the .vcproj
     source_group("src" FILES ${IE_SAMPLES_SOURCES})
@@ -178,10 +176,6 @@ macro(ie_add_sample)
     endif()
     target_include_directories(${IE_SAMPLE_NAME} PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}/../common")
 
-    if(TARGET IE::ie_cpu_extension)
-        target_link_libraries(${IE_SAMPLE_NAME} PRIVATE IE::ie_cpu_extension)
-    endif()
-
     target_link_libraries(${IE_SAMPLE_NAME} PRIVATE ${OpenCV_LIBRARIES} ${InferenceEngine_LIBRARIES}
                                                     ${IE_SAMPLE_DEPENDENCIES} gflags)
 
@@ -216,3 +210,10 @@ file(GLOB samples_dirs RELATIVE ${CMAKE_CURRENT_SOURCE_DIR} *)
 # skip building of unnecessary subdirectories
 list(REMOVE_ITEM samples_dirs common thirdparty)
 add_samples_to_build(${samples_dirs})
+
+if(ENABLE_PYTHON)
+    find_package(PythonInterp 3.5 REQUIRED)
+    find_package(PythonLibs "${PYTHON_VERSION_STRING}" EXACT REQUIRED)  # same version as the interpreter found above
+
+    add_subdirectory(python_demos/human_pose_estimation_3d_demo/pose_extractor)
+endif()
diff --git a/demos/README.md b/demos/README.md
index b41a62cc6da..21f8854e23e 100644
--- a/demos/README.md
+++ b/demos/README.md
@@ -5,7 +5,9 @@ The Open Model Zoo demo applications are console applications that demonstrate h
 
 The Open Model Zoo includes the following demos:
 
+- [3D Human Pose Estimation Python* Demo](./python_demos/human_pose_estimation_3d_demo/README.md) - 3D human pose estimation demo.
 - [Action Recognition Python* Demo](./python_demos/action_recognition/README.md) - Demo application for Action Recognition algorithm, which classifies actions that are being performed on input video.
+- [Colorization Python* Demo](./python_demos/colorization_demo/README.md) - Colorization demo colorizes input frames.
 - [Crossroad Camera C++ Demo](./crossroad_camera_demo/README.md) - Person Detection followed by the Person Attributes Recognition and Person Reidentification Retail, supports images/video and camera inputs.
 - [Gaze Estimation C++ Demo](./gaze_estimation_demo/README.md) - Face detection followed by gaze estimation, head pose estimation and facial landmarks regression.
 - [Human Pose Estimation C++ Demo](./human_pose_estimation_demo/README.md) - Human pose estimation demo.
@@ -16,15 +18,18 @@ The Open Model Zoo includes the following demos:
 - [Interactive Face Recognition Python* Demo](./python_demos/face_recognition_demo/README.md) - Face Detection coupled with Head-Pose, Facial Landmarks and Face Recognition detectors. Supports video and camera inputs.
 - [Mask R-CNN C++ Demo for TensorFlow* Object Detection API](./mask_rcnn_demo/README.md) - Inference of instance segmentation networks created with TensorFlow\* Object Detection API.
 - [Multi-Camera Multi-Person Tracking Python* Demo](./python_demos/multi_camera_multi_person_tracking/README.md) Demo application for multiple persons tracking on multiple cameras.
-- [Multi-Channel Face Detection C++ Demo](./multichannel_demo/README.md) - Simultaneous Multi Camera Face Detection demo.
+- [Multi-Channel C++ Demos](./multi_channel/README.md) - Several demo applications for multi-channel scenarios.
+- [Object Detection for CenterNet Python* Demo](./python_demos/object_detection_demo_centernet/README.md) - Demo application for CenterNet object detection network.
 - [Object Detection for Faster R-CNN C++ Demo](./object_detection_demo_faster_rcnn/README.md) - Inference of object detection networks like Faster R-CNN (the demo supports only images as inputs).
 - [Object Detection for SSD C++ Demo](./object_detection_demo_ssd_async/README.md) - Demo application for SSD-based Object Detection networks, new Async API performance showcase, and simple OpenCV interoperability (supports video and camera inputs).
 - [Object Detection for YOLO V3 C++ Demo](./object_detection_demo_yolov3_async/README.md) - Demo application for YOLOV3-based Object Detection networks, new Async API performance showcase, and simple OpenCV interoperability (supports video and camera inputs).
 - [Pedestrian Tracker C++ Demo](./pedestrian_tracker_demo/README.md) - Demo application for pedestrian tracking scenario.
 - [Security Barrier Camera C++ Demo](./security_barrier_camera_demo/README.md) - Vehicle Detection followed by the Vehicle Attributes and License-Plate Recognition, supports images/video and camera inputs.
+- [Single Human Pose Estimation Python* Demo](./python_demos/single_human_pose_estimation_demo/README.md) - 2D human pose estimation demo.
 - [Smart Classroom C++ Demo](./smart_classroom_demo/README.md) - Face recognition and action detection demo for classroom environment.
 - [Super Resolution C++ Demo](./super_resolution_demo/README.md) - Super Resolution demo (the demo supports only images as inputs). It enhances the resolution of the input image.
 - [Text Detection C++ Demo](./text_detection_demo/README.md) - Text Detection demo. It detects and recognizes multi-oriented scene text on an input image and puts a bounding box around detected area.
+- [Text Spotting Python* Demo](./python_demos/text_spotting_demo/README.md) - The demo demonstrates how to run Text Spotting models.
 
 \* Several C++ demos referenced above have simplified implementation in Python*, located in the `python_demos` directory.
 
@@ -43,6 +48,7 @@ The table below shows the correlation between models, demos, and supported plugi
 
 | Model                                            | Demos supported on the model                                                                                 | CPU       | GPU       | MYRIAD/HDDL | HETERO:FPGA,CPU |
 |--------------------------------------------------|----------------------------------------------------------------------------------------------------------------|-----------|-----------|-------------|-----------------|
+| human-pose-estimation-3d-0001                    | [3D Human Pose Estimation Python* Demo](./python_demos/human_pose_estimation_3d_demo/README.md)    | Supported | Supported |             |                 |
 | action-recognition-0001-decoder                  | [Action Recognition Demo](./python_demos/action_recognition/README.md)            | Supported | Supported |             |                 |
 | action-recognition-0001-encoder                  | [Action Recognition Demo](./python_demos/action_recognition/README.md)            | Supported | Supported |             |                 |
 | driver-action-recognition-adas-0002-decoder      | [Action Recognition Demo](./python_demos/action_recognition/README.md)            | Supported | Supported |             |                 |
@@ -68,10 +74,12 @@ The table below shows the correlation between models, demos, and supported plugi
 | license-plate-recognition-barrier-0001           | [Security Barrier Camera Demo](./security_barrier_camera_demo/README.md)              | Supported | Supported | Supported   | Supported       |
 | vehicle-attributes-recognition-barrier-0039      | [Security Barrier Camera Demo](./security_barrier_camera_demo/README.md)              | Supported | Supported | Supported   | Supported       |
 | vehicle-license-plate-detection-barrier-0106     | [Security Barrier Camera Demo](./security_barrier_camera_demo/README.md)              | Supported | Supported | Supported   | Supported       |
+| vehicle-license-plate-detection-barrier-0123     | [Security Barrier Camera Demo](./security_barrier_camera_demo/README.md)              | Supported | Supported | Supported   | Supported       |
 | face-reidentification-retail-0095                | [Smart Classroom Demo](./smart_classroom_demo/README.md)<br>[Interactive Face Recognition Python* Demo](./python_demos/face_recognition_demo/README.md)                              | Supported | Supported | Supported   | Supported       |
 | landmarks-regression-retail-0009                 | [Smart Classroom Demo](./smart_classroom_demo/README.md)<br>[Interactive Face Recognition Python* Demo](./python_demos/face_recognition_demo/README.md)                              | Supported | Supported | Supported   | Supported       |
 | person-detection-action-recognition-0005         | [Smart Classroom Demo](./smart_classroom_demo/README.md)                              | Supported | Supported | Supported   | Supported       |
 | person-detection-action-recognition-teacher-0002 | [Smart Classroom Demo](./smart_classroom_demo/README.md)                              | Supported | Supported |             | Supported       |
+| single-human-pose-estimation-0001                | [Single Human Pose Estimation Python* Demo](./python_demos/single_human_pose_estimation_demo/README.md)     | Supported | Supported |             |                 |
 | single-image-super-resolution-1032               | [Super Resolution Demo](./super_resolution_demo/README.md)                            | Supported | Supported |             | Supported       |
 | single-image-super-resolution-1033               | [Super Resolution Demo](./super_resolution_demo/README.md)                            | Supported | Supported |             | Supported       |
 | text-detection-0003                              | [Text Detection Demo](./text_detection_demo/README.md)                                | Supported | Supported |             | Supported       |
@@ -146,7 +154,7 @@ make
 ```
 
 For the release configuration, the demo application binaries are in `<path_to_build_directory>/intel64/Release/`;
-for the debug configuration — in `<path_to_build_directory>/intel64/Debug/`.
+for the debug configuration — in `<path_to_build_directory>/intel64/Debug/`.
 
 ### <a name="build_demos_windows"></a>Build the Demos Applications on Microsoft Windows* OS
 
@@ -155,18 +163,18 @@ The recommended Windows* build environment is the following:
 * Microsoft Visual Studio* 2015, 2017, or 2019
 * CMake* version 2.8 or higher
 
-> **NOTE**: If you want to use Microsoft Visual Studio 2019, you are required to install CMake 3.14.
+> **NOTE**: If you want to use Microsoft Visual Studio 2019, you are required to install CMake 3.14.
 
 To build the demo applications for Windows, go to the directory with the `build_demos_msvc.bat`
 batch file and run it:
-```sh
+```bat
 build_demos_msvc.bat
 ```
 
 By default, the script automatically detects the highest Microsoft Visual Studio version installed on the machine and uses it to create and build
 a solution for a demo code. Optionally, you can also specify the preffered Microsoft Visual Studio version to be used by the script. Supported
 versions are: `VS2015`, `VS2017`, `VS2019`. For example, to build the demos using the Microsoft Visual Studio 2017, use the following command:
-```sh
+```bat
 build_demos_msvc.bat VS2017
 ```
 
@@ -177,6 +185,18 @@ build binaries in Debug configuration. Run the appropriate version of the
 Microsoft Visual Studio and open the generated solution file from the `C:\Users\<username>\Documents\Intel\OpenVINO\omz_demos_build\Demos.sln`
 directory.
 
+### <a name="build_python_extensions"></a>Build the Native Python* Extension Modules
+
+Some of the Python demo applications require native Python extension modules to be built before they can be run.
+This requires you to have Python development files (headers and import libraries) installed.
+To build these modules, follow the instructions for building the demo applications above,
+but add `-DENABLE_PYTHON=ON` to either the `cmake` or the `build_demos*` command, depending on which you use.
+For example:
+
+```sh
+cmake -DCMAKE_BUILD_TYPE=Release -DENABLE_PYTHON=ON <open_model_zoo>/demos
+```
+
 ## Get Ready for Running the Demo Applications
 
 ### Get Ready for Running the Demo Applications on Linux*
@@ -206,6 +226,14 @@ source <INSTALL_DIR>/bin/setupvars.sh
 3. Save and close the file: press the **Esc** key, type `:wq` and press the **Enter** key.
 4. To test your change, open a new terminal. You will see `[setupvars.sh] OpenVINO environment initialized`.
 
+To run Python demo applications that require native Python extension modules, you must additionally
+set up the `PYTHONPATH` environment variable as follows, where `<bin_dir>` is the directory with
+the built demo applications:
+
+```sh
+export PYTHONPATH="$PYTHONPATH:<bin_dir>/lib"
+```
+
 You are ready to run the demo applications. To learn about how to run a particular
 demo, read the demo documentation by clicking the demo name in the demo
 list above.
@@ -215,12 +243,20 @@ list above.
 Before running compiled binary files, make sure your application can find the Inference Engine and OpenCV libraries.
 If you use a [proprietary](https://software.intel.com/en-us/openvino-toolkit) distribution to build demos,
 run the `setupvars` script to set all necessary environment variables:
-```sh
+```bat
 <INSTALL_DIR>\bin\setupvars.bat
 ```
 If you use your own Inference Engine and OpenCV binaries to build the demos please make sure you have added
 to the `PATH` environment variable.
 
+To run Python demo applications that require native Python extension modules, you must additionally
+set up the `PYTHONPATH` environment variable as follows, where `<bin_dir>` is the directory with
+the built demo applications:
+
+```bat
+set PYTHONPATH=%PYTHONPATH%;<bin_dir>
+```
+
 To debug or run the demos on Windows in Microsoft Visual Studio, make sure you
 have properly configured **Debugging** environment settings for the **Debug**
 and **Release** configurations. Set correct paths to the OpenCV libraries, and
@@ -229,7 +265,7 @@ For example, for the **Debug** configuration, go to the project's
 **Configuration Properties** to the **Debugging** category and set the `PATH`
 variable in the **Environment** field to the following:
 
-```sh
+```
 PATH=<INSTALL_DIR>\deployment_tools\inference_engine\bin\intel64\Debug;<INSTALL_DIR>\opencv\bin;%PATH%
 ```
 where `<INSTALL_DIR>` is the directory in which the OpenVINO toolkit is installed.
diff --git a/demos/build_demos.sh b/demos/build_demos.sh
index 60e7d79cf0c..e13f4e03046 100755
--- a/demos/build_demos.sh
+++ b/demos/build_demos.sh
@@ -25,6 +25,20 @@ error() {
 }
 trap 'error ${LINENO}' ERR
 
+extra_cmake_opts=()
+
+for opt in "$@"; do
+    case "$opt" in
+    -DENABLE_PYTHON=*)
+        extra_cmake_opts+=("$opt")
+        ;;
+    *)
+        printf "Unknown option: %q\n" "$opt"
+        exit 1
+        ;;
+    esac
+done
+
 DEMOS_PATH="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )"
 
 printf "\nSetting environment variables for building demos...\n"
@@ -38,10 +52,10 @@ if [ -z "$INTEL_OPENVINO_DIR" ]; then
         printf "Error: Failed to set the environment variables automatically. To fix, run the following command:\n source <INSTALL_DIR>/bin/setupvars.sh\n where INSTALL_DIR is the OpenVINO installation directory.\n\n"
         exit 1
     fi
-    if ! source $setvars_path ; then
+    if ! source "$setvars_path"; then
         printf "Unable to run ./setupvars.sh. Please check its presence. \n\n"
-    exit 1
-fi
+        exit 1
+    fi
 else
     # case for run with `sudo -E`
     source "$INTEL_OPENVINO_DIR/bin/setupvars.sh"
@@ -57,17 +71,17 @@ build_dir=$HOME/omz_demos_build
 OS_PATH=$(uname -m)
 NUM_THREADS="-j2"
 
-if [ $OS_PATH == "x86_64" ]; then
-  OS_PATH="intel64"
-  NUM_THREADS="-j8"
+if [ "$OS_PATH" == "x86_64" ]; then
+    OS_PATH="intel64"
+    NUM_THREADS="-j8"
 fi
 
-if [ -e $build_dir/CMakeCache.txt ]; then
-    rm -rf $build_dir/CMakeCache.txt
+if [ -e "$build_dir/CMakeCache.txt" ]; then
+    rm -rf "$build_dir/CMakeCache.txt"
 fi
-mkdir -p $build_dir
-cd $build_dir
-cmake -DCMAKE_BUILD_TYPE=Release $DEMOS_PATH
-make $NUM_THREADS
+mkdir -p "$build_dir"
+
+(cd "$build_dir" && cmake -DCMAKE_BUILD_TYPE=Release "${extra_cmake_opts[@]}" "$DEMOS_PATH")
+cmake --build "$build_dir" -- "$NUM_THREADS"
 
-printf "\nBuild completed, you can find binaries for all demos in the $build_dir/${OS_PATH}/Release subfolder.\n\n"
+printf "\nBuild completed, you can find binaries for all demos in the %s subfolder.\n\n" "$build_dir/$OS_PATH/Release"
diff --git a/demos/build_demos_msvc.bat b/demos/build_demos_msvc.bat
index cc8728c9d61..6eb9737fdc6 100644
--- a/demos/build_demos_msvc.bat
+++ b/demos/build_demos_msvc.bat
@@ -15,8 +15,7 @@
 :: limitations under the License.
 
 
-@setlocal
-SETLOCAL EnableDelayedExpansion
+setlocal EnableDelayedExpansion
 set "ROOT_DIR=%~dp0"
 
 set "SOLUTION_DIR64=%USERPROFILE%\Documents\Intel\OpenVINO\omz_demos_build"
@@ -24,122 +23,141 @@ set "SOLUTION_DIR64=%USERPROFILE%\Documents\Intel\OpenVINO\omz_demos_build"
 set MSBUILD_BIN=
 set VS_PATH=
 set VS_VERSION=
+set EXTRA_CMAKE_OPTS=
 
+:argParse
 if not "%1" == "" (
-   if "%1"=="VS2015" (
-      set "VS_VERSION=2015" 
-   ) else if "%1"=="VS2017" (
-      set "VS_VERSION=2017" 
-   ) else if "%1"=="VS2019" (
-      set "VS_VERSION=2019" 
-   ) else (
-      echo Unrecognized option specified "%1"
-      echo Supported command line options: VS2015, VS2017, VS2019
-      goto errorHandling
-   )
+    rem cmd.exe mangles -DENABLE_PYTHON=YES into -DENABLE_PYTHON YES,
+    rem so it gets split into two arguments
+    if "%1" == "-DENABLE_PYTHON" (
+        set EXTRA_CMAKE_OPTS=%EXTRA_CMAKE_OPTS% %1=%2
+        shift & shift
+        goto argParse
+    )
+
+    if not "%VS_VERSION%" == "" (
+        echo Unexpected argument: "%1"
+        goto errorHandling
+    )
+
+    if "%1"=="VS2015" (
+        set "VS_VERSION=2015"
+    ) else if "%1"=="VS2017" (
+        set "VS_VERSION=2017"
+    ) else if "%1"=="VS2019" (
+        set "VS_VERSION=2019"
+    ) else (
+        echo Unrecognized Visual Studio version specified: "%1"
+        echo Supported versions: VS2015, VS2017, VS2019
+        goto errorHandling
+    )
+
+    shift
+    goto argparse
 )
 
 if "%INTEL_OPENVINO_DIR%"=="" (
     if exist "%ROOT_DIR%\..\..\bin\setupvars.bat" (
         call "%ROOT_DIR%\..\..\bin\setupvars.bat"
+    ) else if exist "%ROOT_DIR%\..\..\..\bin\setupvars.bat" (
+        call "%ROOT_DIR%\..\..\..\bin\setupvars.bat"
     ) else (
-        if exist "%ROOT_DIR%\..\..\..\bin\setupvars.bat" (
-            call "%ROOT_DIR%\..\..\..\bin\setupvars.bat"
-      ) else (
-         echo Failed to set the environment variables automatically
-         echo To fix, run the following command: ^<INSTALL_DIR^>\bin\setupvars.bat
-         echo where INSTALL_DIR is the OpenVINO installation directory.
-         GOTO errorHandling
-      )
+        echo Failed to set the environment variables automatically
+        echo To fix, run the following command: ^<INSTALL_DIR^>\bin\setupvars.bat
+        echo where INSTALL_DIR is the OpenVINO installation directory.
+        goto errorHandling
     )
-) 
+)
 
 if "%PROCESSOR_ARCHITECTURE%" == "AMD64" (
-   set "PLATFORM=x64"
+    set "PLATFORM=x64"
 ) else (
-   set "PLATFORM=Win32"
+    set "PLATFORM=Win32"
 )
 
 set VSWHERE="false"
 if exist "%ProgramFiles(x86)%\Microsoft Visual Studio\Installer\vswhere.exe" (
-   set VSWHERE="true"
-   cd "%ProgramFiles(x86)%\Microsoft Visual Studio\Installer"
+    set VSWHERE="true"
+    cd "%ProgramFiles(x86)%\Microsoft Visual Studio\Installer"
 ) else if exist "%ProgramFiles%\Microsoft Visual Studio\Installer\vswhere.exe" (
-      set VSWHERE="true"
-      cd "%ProgramFiles%\Microsoft Visual Studio\Installer"
+    set VSWHERE="true"
+    cd "%ProgramFiles%\Microsoft Visual Studio\Installer"
 ) else (
-   echo "vswhere tool is not found"
+    echo "vswhere tool is not found"
 )
 
 if !VSWHERE! == "true" (
-   if "!VS_VERSION!"=="" (
-      echo Searching the latest Visual Studio...
-      for /f "usebackq tokens=*" %%i in (`vswhere -latest -products * -requires Microsoft.Component.MSBuild -property installationPath`) do (
-         set VS_PATH=%%i
-      )
-   ) else (
-      echo Searching Visual Studio !VS_VERSION!...
-      for /f "usebackq tokens=*" %%i in (`vswhere -products * -requires Microsoft.Component.MSBuild -property installationPath`) do (
-         set CUR_VS=%%i
-         if not "!CUR_VS:%VS_VERSION%=!"=="!CUR_VS!" (
-            set VS_PATH=!CUR_VS!
-         )
-      )
-   )
-   if exist "!VS_PATH!\MSBuild\14.0\Bin\MSBuild.exe" (
-      set "MSBUILD_BIN=!VS_PATH!\MSBuild\14.0\Bin\MSBuild.exe"
-   )
-   if exist "!VS_PATH!\MSBuild\15.0\Bin\MSBuild.exe" (
-      set "MSBUILD_BIN=!VS_PATH!\MSBuild\15.0\Bin\MSBuild.exe"
-   )
-   if exist "!VS_PATH!\MSBuild\Current\Bin\MSBuild.exe" (
-      set "MSBUILD_BIN=!VS_PATH!\MSBuild\Current\Bin\MSBuild.exe"
-   )
+    if "!VS_VERSION!"=="" (
+        echo Searching the latest Visual Studio...
+        for /f "usebackq tokens=*" %%i in (`vswhere -latest -products * -requires Microsoft.Component.MSBuild -property installationPath`) do (
+            set VS_PATH=%%i
+        )
+    ) else (
+        echo Searching Visual Studio !VS_VERSION!...
+        for /f "usebackq tokens=*" %%i in (`vswhere -products * -requires Microsoft.Component.MSBuild -property installationPath`) do (
+            set CUR_VS=%%i
+            if not "!CUR_VS:%VS_VERSION%=!"=="!CUR_VS!" (
+                set VS_PATH=!CUR_VS!
+            )
+        )
+    )
+    if exist "!VS_PATH!\MSBuild\14.0\Bin\MSBuild.exe" (
+        set "MSBUILD_BIN=!VS_PATH!\MSBuild\14.0\Bin\MSBuild.exe"
+    )
+    if exist "!VS_PATH!\MSBuild\15.0\Bin\MSBuild.exe" (
+        set "MSBUILD_BIN=!VS_PATH!\MSBuild\15.0\Bin\MSBuild.exe"
+    )
+    if exist "!VS_PATH!\MSBuild\Current\Bin\MSBuild.exe" (
+        set "MSBUILD_BIN=!VS_PATH!\MSBuild\Current\Bin\MSBuild.exe"
+    )
 )
 
 if "!MSBUILD_BIN!" == "" (
-   if "!VS_VERSION!"=="2015" (
-      if exist "C:\Program Files (x86)\MSBuild\14.0\Bin\MSBuild.exe" (
-         set "MSBUILD_BIN=C:\Program Files (x86)\MSBuild\14.0\Bin\MSBuild.exe"
-         set "MSBUILD_VERSION=14 2015"
-      )
-   ) else if "!VS_VERSION!"=="2017" (
-      if exist "C:\Program Files (x86)\Microsoft Visual Studio\2017\BuildTools\MSBuild\15.0\Bin\MSBuild.exe" (
-         set "MSBUILD_BIN=C:\Program Files (x86)\Microsoft Visual Studio\2017\BuildTools\MSBuild\15.0\Bin\MSBuild.exe"
-         set "MSBUILD_VERSION=15 2017"
-      ) else if exist "C:\Program Files (x86)\Microsoft Visual Studio\2017\Professional\MSBuild\15.0\Bin\MSBuild.exe" (
-         set "MSBUILD_BIN=C:\Program Files (x86)\Microsoft Visual Studio\2017\Professional\MSBuild\15.0\Bin\MSBuild.exe"
-         set "MSBUILD_VERSION=15 2017"
-      ) else if exist "C:\Program Files (x86)\Microsoft Visual Studio\2017\Community\MSBuild\15.0\Bin\MSBuild.exe" (
-         set "MSBUILD_BIN=C:\Program Files (x86)\Microsoft Visual Studio\2017\Community\MSBuild\15.0\Bin\MSBuild.exe"
-         set "MSBUILD_VERSION=15 2017"
-      )
-   )
+    if "!VS_VERSION!"=="2015" (
+        if exist "C:\Program Files (x86)\MSBuild\14.0\Bin\MSBuild.exe" (
+            set "MSBUILD_BIN=C:\Program Files (x86)\MSBuild\14.0\Bin\MSBuild.exe"
+            set "MSBUILD_VERSION=14 2015"
+        )
+    ) else if "!VS_VERSION!"=="2017" (
+        if exist "C:\Program Files (x86)\Microsoft Visual Studio\2017\BuildTools\MSBuild\15.0\Bin\MSBuild.exe" (
+            set "MSBUILD_BIN=C:\Program Files (x86)\Microsoft Visual Studio\2017\BuildTools\MSBuild\15.0\Bin\MSBuild.exe"
+            set "MSBUILD_VERSION=15 2017"
+        ) else if exist "C:\Program Files (x86)\Microsoft Visual Studio\2017\Professional\MSBuild\15.0\Bin\MSBuild.exe" (
+            set "MSBUILD_BIN=C:\Program Files (x86)\Microsoft Visual Studio\2017\Professional\MSBuild\15.0\Bin\MSBuild.exe"
+            set "MSBUILD_VERSION=15 2017"
+        ) else if exist "C:\Program Files (x86)\Microsoft Visual Studio\2017\Community\MSBuild\15.0\Bin\MSBuild.exe" (
+            set "MSBUILD_BIN=C:\Program Files (x86)\Microsoft Visual Studio\2017\Community\MSBuild\15.0\Bin\MSBuild.exe"
+            set "MSBUILD_VERSION=15 2017"
+        )
+    )
 ) else (
-   if not "!MSBUILD_BIN:2019=!"=="!MSBUILD_BIN!" set "MSBUILD_VERSION=16 2019"
-   if not "!MSBUILD_BIN:2017=!"=="!MSBUILD_BIN!" set "MSBUILD_VERSION=15 2017"
-   if not "!MSBUILD_BIN:2015=!"=="!MSBUILD_BIN!" set "MSBUILD_VERSION=14 2015"
+    if not "!MSBUILD_BIN:2019=!"=="!MSBUILD_BIN!" set "MSBUILD_VERSION=16 2019"
+    if not "!MSBUILD_BIN:2017=!"=="!MSBUILD_BIN!" set "MSBUILD_VERSION=15 2017"
+    if not "!MSBUILD_BIN:2015=!"=="!MSBUILD_BIN!" set "MSBUILD_VERSION=14 2015"
 )
 
 if "!MSBUILD_BIN!" == "" (
-   echo Build tools for Microsoft Visual Studio !VS_VERSION! cannot be found. If you use Visual Studio 2017, please download and install build tools from https://www.visualstudio.com/downloads/#build-tools-for-visual-studio-2017
-   GOTO errorHandling
+    echo Build tools for Microsoft Visual Studio !VS_VERSION! cannot be found. If you use Visual Studio 2017, please download and install build tools from https://www.visualstudio.com/downloads/#build-tools-for-visual-studio-2017
+    goto errorHandling
 )
 
 if exist "%SOLUTION_DIR64%\CMakeCache.txt" del "%SOLUTION_DIR64%\CMakeCache.txt"
 
 echo Creating Visual Studio %MSBUILD_VERSION% %PLATFORM% files in %SOLUTION_DIR64%... && ^
-cd "%ROOT_DIR%" && cmake -E make_directory "%SOLUTION_DIR64%" && cd "%SOLUTION_DIR64%" && cmake -G "Visual Studio !MSBUILD_VERSION!" -A %PLATFORM% "%ROOT_DIR%"
+cd "%ROOT_DIR%" && cmake -E make_directory "%SOLUTION_DIR64%"
+
+cd "%SOLUTION_DIR64%" && cmake -G "Visual Studio !MSBUILD_VERSION!" -A %PLATFORM% %EXTRA_CMAKE_OPTS% "%ROOT_DIR%"
 
 echo.
 echo ###############^|^| Build Inference Engine Demos using MS Visual Studio (MSBuild.exe) ^|^|###############
 echo.
 echo "!MSBUILD_BIN!" Demos.sln /p:Configuration=Release
 "!MSBUILD_BIN!" Demos.sln /p:Configuration=Release
-if ERRORLEVEL 1 GOTO errorHandling
+if ERRORLEVEL 1 goto errorHandling
 
 echo Done.
 goto :eof
 
 :errorHandling
 echo Error
+exit /B 1
diff --git a/demos/common/CMakeLists.txt b/demos/common/CMakeLists.txt
new file mode 100644
index 00000000000..20f29f9b051
--- /dev/null
+++ b/demos/common/CMakeLists.txt
@@ -0,0 +1,5 @@
+# Copyright (C) 2018-2019 Intel Corporation
+# SPDX-License-Identifier: Apache-2.0
+#
+
+add_subdirectory(monitors)
diff --git a/demos/common/format_reader/CMakeLists.txt b/demos/common/format_reader/CMakeLists.txt
deleted file mode 100644
index c4011c48a70..00000000000
--- a/demos/common/format_reader/CMakeLists.txt
+++ /dev/null
@@ -1,45 +0,0 @@
-# Copyright (C) 2018-2019 Intel Corporation
-# SPDX-License-Identifier: Apache-2.0
-#
-
-set (TARGET_NAME "format_reader")
-
-file (GLOB MAIN_SRC
-        ${CMAKE_CURRENT_SOURCE_DIR}/*.cpp
-        )
-
-file (GLOB LIBRARY_HEADERS
-        ${CMAKE_CURRENT_SOURCE_DIR}/*.h
-        )
-
-# Find OpenCV components if exist
-find_package(OpenCV COMPONENTS imgcodecs videoio imgproc QUIET)
-if(NOT(OpenCV_FOUND))
-    message(WARNING "OPENCV is disabled or not found, " ${TARGET_NAME} " is built without OPENCV support")
-endif()
-
-# Create named folders for the sources within the .vcproj
-# Empty name lists them directly under the .vcproj
-source_group("src" FILES ${LIBRARY_SRC})
-source_group("include" FILES ${LIBRARY_HEADERS})
-
-
-# Create library file from sources.
-add_library(${TARGET_NAME} SHARED ${MAIN_SRC} ${LIBRARY_HEADERS})
-
-if(OpenCV_FOUND)
-	target_link_libraries(${TARGET_NAME} PRIVATE ${OpenCV_LIBRARIES})
-	target_compile_definitions(${TARGET_NAME} PRIVATE USE_OPENCV)
-endif()
-
-target_compile_definitions(${TARGET_NAME} PRIVATE IMPLEMENT_FORMAT_READER)
-
-target_include_directories(${TARGET_NAME} PUBLIC "${CMAKE_CURRENT_SOURCE_DIR}"
-                                                 "${CMAKE_CURRENT_SOURCE_DIR}/..")
-
-set_target_properties(${TARGET_NAME} PROPERTIES COMPILE_PDB_NAME ${TARGET_NAME})
-
-# developer package
-
-export(TARGETS ${TARGET_NAME} NAMESPACE IE::
-       APPEND FILE "${CMAKE_BINARY_DIR}/targets_developer.cmake")
diff --git a/demos/common/format_reader/MnistUbyte.cpp b/demos/common/format_reader/MnistUbyte.cpp
deleted file mode 100644
index 6e46f0ec7b7..00000000000
--- a/demos/common/format_reader/MnistUbyte.cpp
+++ /dev/null
@@ -1,63 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-#include <fstream>
-#include <iostream>
-#include <string>
-#include <MnistUbyte.h>
-
-using namespace FormatReader;
-
-int MnistUbyte::reverseInt(int i) {
-    unsigned char ch1, ch2, ch3, ch4;
-    ch1 = (unsigned char) (i & 255);
-    ch2 = (unsigned char) ((i >> 8) & 255);
-    ch3 = (unsigned char) ((i >> 16) & 255);
-    ch4 = (unsigned char) ((i >> 24) & 255);
-    return (static_cast<int>(ch1) << 24) + (static_cast<int>(ch2) << 16) + (static_cast<int>(ch3) << 8) + ch4;
-}
-
-MnistUbyte::MnistUbyte(const std::string &filename) {
-    std::ifstream file(filename, std::ios::binary);
-    if (!file.is_open()) {
-        return;
-    }
-    int magic_number = 0;
-    int number_of_images = 0;
-    int n_rows = 0;
-    int n_cols = 0;
-    file.read(reinterpret_cast<char *>(&magic_number), sizeof(magic_number));
-    magic_number = reverseInt(magic_number);
-    if (magic_number != 2051) {
-        return;
-    }
-    file.read(reinterpret_cast<char *>(&number_of_images), sizeof(number_of_images));
-    number_of_images = reverseInt(number_of_images);
-    file.read(reinterpret_cast<char *>(&n_rows), sizeof(n_rows));
-    n_rows = reverseInt(n_rows);
-    _height = (size_t) n_rows;
-    file.read(reinterpret_cast<char *>(&n_cols), sizeof(n_cols));
-    n_cols = reverseInt(n_cols);
-    _width = (size_t) n_cols;
-    if (number_of_images > 1) {
-        std::cout << "[MNIST] Warning: number_of_images  in mnist file equals " << number_of_images
-                  << ". Only a first image will be read." << std::endl;
-    }
-
-    size_t size = _width * _height * 1;
-
-    _data.reset(new unsigned char[size], std::default_delete<unsigned char[]>());
-    size_t count = 0;
-    if (0 < number_of_images) {
-        for (int r = 0; r < n_rows; ++r) {
-            for (int c = 0; c < n_cols; ++c) {
-                unsigned char temp = 0;
-                file.read(reinterpret_cast<char *>(&temp), sizeof(temp));
-                _data.get()[count++] = temp;
-            }
-        }
-    }
-
-    file.close();
-}
diff --git a/demos/common/format_reader/MnistUbyte.h b/demos/common/format_reader/MnistUbyte.h
deleted file mode 100644
index fd6ae0f75e8..00000000000
--- a/demos/common/format_reader/MnistUbyte.h
+++ /dev/null
@@ -1,58 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-/**
- * \brief Mnist reader
- * \file MnistUbyte.h
- */
-#pragma once
-
-#include <memory>
-#include <string>
-#include <format_reader.h>
-
-#include "register.h"
-
-namespace FormatReader {
-/**
- * \class MnistUbyte
- * \brief Reader for mnist db files
- */
-class MnistUbyte : public Reader {
-private:
-    int reverseInt(int i);
-
-    static Register<MnistUbyte> reg;
-
-public:
-    /**
-     * \brief Constructor of Mnist reader
-     * @param filename - path to input data
-     * @return MnistUbyte reader object
-     */
-    explicit MnistUbyte(const std::string &filename);
-    virtual ~MnistUbyte() {
-    }
-
-    /**
-     * \brief Get size
-     * @return size
-     */
-    size_t size() const override {
-        return _width * _height * 1;
-    }
-
-    void Release() noexcept override {
-        delete this;
-    }
-
-    std::shared_ptr<unsigned char> getData(size_t width, size_t height) override {
-        if ((width * height != 0) && (_width * _height != width * height)) {
-            std::cout << "[ WARNING ] Image won't be resized! Please use OpenCV.\n";
-            return nullptr;
-        }
-        return _data;
-    }
-};
-}  // namespace FormatReader
diff --git a/demos/common/format_reader/bmp.cpp b/demos/common/format_reader/bmp.cpp
deleted file mode 100644
index b52f839abcb..00000000000
--- a/demos/common/format_reader/bmp.cpp
+++ /dev/null
@@ -1,63 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-#include "bmp.h"
-#include <fstream>
-#include <iostream>
-
-using namespace std;
-using namespace FormatReader;
-
-
-BitMap::BitMap(const string &filename) {
-    BmpHeader header;
-    BmpInfoHeader infoHeader;
-
-    ifstream input(filename, ios::binary);
-    if (!input) {
-        return;
-    }
-
-    input.read(reinterpret_cast<char *>(&header.type), 2);
-
-    if (header.type != 'M'*256+'B') {
-        std::cerr << "[BMP] file is not bmp type\n";
-        return;
-    }
-
-    input.read(reinterpret_cast<char *>(&header.size), 4);
-    input.read(reinterpret_cast<char *>(&header.reserved), 4);
-    input.read(reinterpret_cast<char *>(&header.offset), 4);
-
-    input.read(reinterpret_cast<char *>(&infoHeader), sizeof(BmpInfoHeader));
-
-
-    bool rowsReversed = infoHeader.height < 0;
-    _width = infoHeader.width;
-    _height = abs(infoHeader.height);
-
-    if (infoHeader.bits != 24) {
-        cerr << "[BMP] 24bpp only supported. But input has:" << infoHeader.bits << "\n";
-        return;
-    }
-
-    if (infoHeader.compression != 0) {
-        cerr << "[BMP] compression not supported\n";
-    }
-
-    int padSize = _width & 3;
-    char pad[3];
-    size_t size = _width * _height * 3;
-
-    _data.reset(new unsigned char[size], std::default_delete<unsigned char[]>());
-
-    input.seekg(header.offset, ios::beg);
-
-    // reading by rows in invert vertically
-    for (uint32_t i = 0; i < _height; i++) {
-        uint32_t storeAt = rowsReversed ? i : (uint32_t)_height - 1 - i;
-        input.read(reinterpret_cast<char *>(_data.get()) + _width * 3 * storeAt, _width * 3);
-        input.read(pad, padSize);
-    }
-}
diff --git a/demos/common/format_reader/bmp.h b/demos/common/format_reader/bmp.h
deleted file mode 100644
index b1b05dfc249..00000000000
--- a/demos/common/format_reader/bmp.h
+++ /dev/null
@@ -1,75 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-/**
- * \brief BMP reader
- * \file bmp.h
- */
-#pragma once
-
-#include <memory>
-#include <string>
-#include <format_reader.h>
-
-#include "register.h"
-
-namespace FormatReader {
-/**
- * \class BitMap
- * \brief Reader for bmp files
- */
-class BitMap : public Reader {
-private:
-    static Register<BitMap> reg;
-
-    typedef struct {
-        unsigned short type   = 0u;              /* Magic identifier            */
-        unsigned int size     = 0u;              /* File size in bytes          */
-        unsigned int reserved = 0u;
-        unsigned int offset   = 0u;              /* Offset to image data, bytes */
-    } BmpHeader;
-
-    typedef struct {
-        unsigned int size = 0u;                  /* Header size in bytes      */
-        int width = 0, height = 0;               /* Width and height of image */
-        unsigned short planes = 0u;              /* Number of colour planes   */
-        unsigned short bits = 0u;                /* Bits per pixel            */
-        unsigned int compression = 0u;           /* Compression type          */
-        unsigned int imagesize = 0u;             /* Image size in bytes       */
-        int xresolution = 0, yresolution = 0;    /* Pixels per meter          */
-        unsigned int ncolours = 0u;              /* Number of colours         */
-        unsigned int importantcolours = 0u;      /* Important colours         */
-    } BmpInfoHeader;
-
-public:
-    /**
-     * \brief Constructor of BMP reader
-     * @param filename - path to input data
-     * @return BitMap reader object
-     */
-    explicit BitMap(const std::string &filename);
-    virtual ~BitMap() {
-    }
-
-    /**
-     * \brief Get size
-     * @return size
-     */
-    size_t size() const override {
-        return _width * _height * 3;
-    }
-
-    void Release() noexcept override {
-        delete this;
-    }
-
-    std::shared_ptr<unsigned char> getData(size_t width, size_t height) override {
-        if ((width * height != 0) && (_width * _height != width * height)) {
-            std::cout << "[ WARNING ] Image won't be resized! Please use OpenCV.\n";
-            return nullptr;
-        }
-        return _data;
-    }
-};
-}  // namespace FormatReader
diff --git a/demos/common/format_reader/format_reader.cpp b/demos/common/format_reader/format_reader.cpp
deleted file mode 100644
index 30f33453216..00000000000
--- a/demos/common/format_reader/format_reader.cpp
+++ /dev/null
@@ -1,37 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-#include <iostream>
-#include <format_reader.h>
-#include "bmp.h"
-#include "MnistUbyte.h"
-#include "opencv_wraper.h"
-
-using namespace FormatReader;
-
-std::vector<Registry::CreatorFunction> Registry::_data;
-
-Register<MnistUbyte> MnistUbyte::reg;
-#ifdef USE_OPENCV
-Register<OCVReader> OCVReader::reg;
-#else
-Register<BitMap> BitMap::reg;
-#endif
-
-Reader *Registry::CreateReader(const char *filename) {
-    for (auto maker : _data) {
-        Reader *ol = maker(filename);
-        if (ol != nullptr && ol->size() != 0) return ol;
-        if (ol != nullptr) ol->Release();
-    }
-    return nullptr;
-}
-
-void Registry::RegisterReader(CreatorFunction f) {
-    _data.push_back(f);
-}
-
-FORMAT_READER_API(Reader*) CreateFormatReader(const char *filename) {
-    return Registry::CreateReader(filename);
-}
\ No newline at end of file
diff --git a/demos/common/format_reader/format_reader.h b/demos/common/format_reader/format_reader.h
deleted file mode 100644
index d0c746275b7..00000000000
--- a/demos/common/format_reader/format_reader.h
+++ /dev/null
@@ -1,81 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-/**
- * \brief Format reader abstract class implementation
- * \file format_reader.h
- */
-#pragma once
-
-#include <memory>
-#include <string>
-#include <vector>
-#include <iostream>
-
-#if defined(_WIN32)
-# ifdef IMPLEMENT_FORMAT_READER
-# define FORMAT_READER_API(type) extern "C"   __declspec(dllexport) type
-# else
-# define FORMAT_READER_API(type) extern "C" type
-# endif
-#elif(__GNUC__ >= 4)
-# ifdef IMPLEMENT_FORMAT_READER
-#  define FORMAT_READER_API(type) extern "C"   __attribute__((visibility("default"))) type
-# else
-#  define FORMAT_READER_API(type) extern "C" type
-# endif
-#else
-# define FORMAT_READER_API(TYPE) extern "C" TYPE
-#endif
-
-
-namespace FormatReader {
-/**
- * \class FormatReader
- * \brief This is an abstract class for reading input data
- */
-class Reader {
-protected:
-    /// \brief height
-    size_t _height = 0;
-    /// \brief width
-    size_t _width = 0;
-    /// \brief data
-    std::shared_ptr<unsigned char> _data;
-
-public:
-    /**
-     * \brief Get width
-     * @return width
-     */
-    size_t width() const { return _width; }
-
-    /**
-     * \brief Get height
-     * @return height
-     */
-    size_t height() const { return _height; }
-
-    /**
-     * \brief Get input data ptr
-     * @return shared pointer with input data
-     * @In case of using OpenCV, parameters width and height will be used for image resizing
-     */
-    virtual std::shared_ptr<unsigned char> getData(size_t width = 0, size_t height = 0) = 0;
-
-    /**
-     * \brief Get size
-     * @return size
-     */
-    virtual size_t size() const = 0;
-
-    virtual void Release() noexcept = 0;
-};
-}  // namespace FormatReader
-
-/**
- * \brief Function for create reader
- * @return FormatReader pointer
- */
-FORMAT_READER_API(FormatReader::Reader*) CreateFormatReader(const char *filename);
\ No newline at end of file
diff --git a/demos/common/format_reader/format_reader_ptr.h b/demos/common/format_reader/format_reader_ptr.h
deleted file mode 100644
index 0b82d467457..00000000000
--- a/demos/common/format_reader/format_reader_ptr.h
+++ /dev/null
@@ -1,45 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-/**
- * \brief Implementation of smart pointer for Reader class
- * \file format_reader_ptr.h
- */
-#pragma once
-
-#include "format_reader.h"
-#include <functional>
-#include <memory>
-
-namespace FormatReader {
-class ReaderPtr {
-public:
-    explicit ReaderPtr(const char *imageName) : reader(CreateFormatReader(imageName),
-                                                [](Reader *p) {
-                                                p->Release();
-                                           }) {}
-    /**
-     * @brief dereference operator overload
-     * @return Reader
-     */
-    Reader *operator->() const noexcept {
-        return reader.get();
-    }
-
-    /**
-     * @brief dereference operator overload
-     * @return Reader
-     */
-    Reader *operator*() const noexcept {
-        return reader.get();
-    }
-
-    Reader *get() {
-        return reader.get();
-    }
-
-protected:
-    std::unique_ptr<Reader, std::function<void(Reader *)>> reader;
-};
-}  // namespace FormatReader
diff --git a/demos/common/format_reader/opencv_wraper.cpp b/demos/common/format_reader/opencv_wraper.cpp
deleted file mode 100644
index 835402ab6a7..00000000000
--- a/demos/common/format_reader/opencv_wraper.cpp
+++ /dev/null
@@ -1,48 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-#ifdef USE_OPENCV
-#include "opencv_wraper.h"
-#include <fstream>
-#include <iostream>
-
-#include <opencv2/opencv.hpp>
-
-#include <samples/slog.hpp>
-
-using namespace std;
-using namespace FormatReader;
-
-OCVReader::OCVReader(const string &filename) {
-    img = cv::imread(filename);
-    _size = 0;
-
-    if (img.empty()) {
-        return;
-    }
-
-    _size   = img.size().width * img.size().height * img.channels();
-    _width  = img.size().width;
-    _height = img.size().height;
-}
-
-std::shared_ptr<unsigned char> OCVReader::getData(size_t width = 0, size_t height = 0) {
-    cv::Mat resized(img);
-    if (width != 0 && height != 0) {
-        size_t iw = img.size().width;
-        size_t ih = img.size().height;
-        if (width != iw || height != ih) {
-            slog::warn << "Image is resized from (" << iw << ", " << ih << ") to (" << width << ", " << height << ")" << slog::endl;
-        }
-        cv::resize(img, resized, cv::Size(width, height));
-    }
-
-    size_t size = resized.size().width * resized.size().height * resized.channels();
-    _data.reset(new unsigned char[size], std::default_delete<unsigned char[]>());
-    for (size_t id = 0; id < size; ++id) {
-        _data.get()[id] = resized.data[id];
-    }
-    return _data;
-}
-#endif
diff --git a/demos/common/format_reader/opencv_wraper.h b/demos/common/format_reader/opencv_wraper.h
deleted file mode 100644
index 5dc0b12f4da..00000000000
--- a/demos/common/format_reader/opencv_wraper.h
+++ /dev/null
@@ -1,56 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-/**
- * \brief Image reader
- * \file opencv_wraper.h
- */
-#pragma once
-
-#ifdef USE_OPENCV
-#include <memory>
-#include <string>
-#include <format_reader.h>
-
-#include <opencv2/opencv.hpp>
-
-#include "register.h"
-
-namespace FormatReader {
-/**
- * \class OCVMAT
- * \brief OpenCV Wraper
- */
-class OCVReader : public Reader {
-private:
-    cv::Mat img;
-    size_t _size;
-    static Register<OCVReader> reg;
-
-public:
-    /**
-    * \brief Constructor of BMP reader
-    * @param filename - path to input data
-    * @return BitMap reader object
-    */
-    explicit OCVReader(const std::string &filename);
-    virtual ~OCVReader() {
-    }
-
-    /**
-    * \brief Get size
-    * @return size
-    */
-    size_t size() const override {
-        return _size;
-    }
-
-    void Release() noexcept override {
-        delete this;
-    }
-
-    std::shared_ptr<unsigned char> getData(size_t width, size_t height) override;
-};
-}  // namespace FormatReader
-#endif
\ No newline at end of file
diff --git a/demos/common/format_reader/register.h b/demos/common/format_reader/register.h
deleted file mode 100644
index 34cf1f77f20..00000000000
--- a/demos/common/format_reader/register.h
+++ /dev/null
@@ -1,56 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-/**
- * \brief Register for readers
- * \file register.h
- */
-#pragma once
-
-#include <format_reader.h>
-#include <functional>
-#include <vector>
-#include <string>
-
-namespace FormatReader {
-/**
- * \class Registry
- * \brief Create reader from fabric
- */
-class Registry {
-private:
-    typedef std::function<Reader *(const std::string &filename)> CreatorFunction;
-    static std::vector<CreatorFunction> _data;
-public:
-    /**
-     * \brief Create reader
-     * @param filename - path to input data
-     * @return Reader for input data or nullptr
-     */
-    static Reader *CreateReader(const char *filename);
-
-    /**
-     * \brief Registers reader in fabric
-     * @param f - a creation function
-     */
-    static void RegisterReader(CreatorFunction f);
-};
-
-/**
- * \class Register
- * \brief Registers reader in fabric
- */
-template<typename To>
-class Register {
-public:
-    /**
-     * \brief Constructor creates creation function for fabric
-     * @return Register object
-     */
-    Register() {
-        Registry::RegisterReader([](const std::string &filename) -> Reader * {
-            return new To(filename);
-        });
-    }
-};
-}  // namespace FormatReader
\ No newline at end of file
diff --git a/demos/common/monitors/CMakeLists.txt b/demos/common/monitors/CMakeLists.txt
new file mode 100644
index 00000000000..df429408a13
--- /dev/null
+++ b/demos/common/monitors/CMakeLists.txt
@@ -0,0 +1,23 @@
+# Copyright (C) 2018-2019 Intel Corporation
+# SPDX-License-Identifier: Apache-2.0
+#
+
+find_package(OpenCV REQUIRED COMPONENTS core imgproc)
+
+set(SOURCES presenter.cpp cpu_monitor.cpp memory_monitor.cpp)
+set(HEADERS presenter.h cpu_monitor.h memory_monitor.h)
+if(WIN32)  # query_wrapper is built only on Windows, where the library also links against pdh (see below)
+    list(APPEND SOURCES query_wrapper.cpp)
+    list(APPEND HEADERS query_wrapper.h)
+endif()
+# Group the files into "src" and "include" folders in generated IDE projects
+# (source_group() only affects how the files are presented, not how they are built)
+source_group("src" FILES ${SOURCES})
+source_group("include" FILES ${HEADERS})
+
+add_library(monitors STATIC ${SOURCES} ${HEADERS})
+target_include_directories(monitors PUBLIC "${CMAKE_CURRENT_SOURCE_DIR}")  # users include the headers from this directory
+target_link_libraries(monitors PRIVATE opencv_core opencv_imgproc)
+if(WIN32)
+    target_link_libraries(monitors PRIVATE pdh)
+endif()
diff --git a/demos/common/monitors/cpu_monitor.cpp b/demos/common/monitors/cpu_monitor.cpp
new file mode 100644
index 00000000000..00a841287dd
--- /dev/null
+++ b/demos/common/monitors/cpu_monitor.cpp
@@ -0,0 +1,199 @@
+// Copyright (C) 2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#include "cpu_monitor.h"
+#include <algorithm>
+#ifdef _WIN32
+#include "query_wrapper.h"
+#include <string>
+#include <system_error>
+#include <pdhmsg.h>
+#include <windows.h>
+
+namespace {
+const std::size_t nCores = []() { // processor count reported by GetSystemInfo(), read once at initialization
+        SYSTEM_INFO sysinfo;
+        GetSystemInfo(&sysinfo);
+        return sysinfo.dwNumberOfProcessors;
+    }();
+}
+
+class CpuMonitor::PerformanceCounter { // Windows backend: one PDH "% Processor Time" counter per core
+public:
+    PerformanceCounter() : coreTimeCounters(nCores) { // throws std::system_error if any PDH call fails
+        PDH_STATUS status;
+        for (std::size_t i = 0; i < nCores; ++i) {
+            std::wstring fullCounterPath{L"\\Processor(" + std::to_wstring(i) + L")\\% Processor Time"};
+            status = PdhAddCounterW(query, fullCounterPath.c_str(), 0, &coreTimeCounters[i]);
+            if (ERROR_SUCCESS != status) {
+                throw std::system_error(status, std::system_category(), "PdhAddCounterW() failed");
+            }
+            status = PdhSetCounterScaleFactor(coreTimeCounters[i], -2); // scale counter to [0, 1]
+            if (ERROR_SUCCESS != status) {
+                throw std::system_error(status, std::system_category(), "PdhSetCounterScaleFactor() failed");
+            }
+        }
+        status = PdhCollectQueryData(query); // first collection; getCpuLoad() collects again before reading values
+        if (ERROR_SUCCESS != status) {
+            throw std::system_error(status, std::system_category(), "PdhCollectQueryData() failed");
+        }
+    }
+
+    std::vector<double> getCpuLoad() { // one load value per core; throws if PDH reports an error or invalid data
+        PDH_STATUS status;
+        status = PdhCollectQueryData(query);
+        if (ERROR_SUCCESS != status) {
+            throw std::system_error(status, std::system_category(), "PdhCollectQueryData() failed");
+        }
+
+        PDH_FMT_COUNTERVALUE displayValue;
+        std::vector<double> cpuLoad(coreTimeCounters.size());
+        for (std::size_t i = 0; i < coreTimeCounters.size(); ++i) {
+            status = PdhGetFormattedCounterValue(coreTimeCounters[i], PDH_FMT_DOUBLE, NULL,
+                &displayValue);
+            if (ERROR_SUCCESS != status) {
+                throw std::system_error(status, std::system_category(), "PdhGetFormattedCounterValue() failed");
+            }
+            if (PDH_CSTATUS_VALID_DATA != displayValue.CStatus && PDH_CSTATUS_NEW_DATA != displayValue.CStatus) {
+                throw std::runtime_error("Error in counter data"); // the call succeeded but the value is not usable
+            }
+
+            cpuLoad[i] = displayValue.doubleValue;
+        }
+        return cpuLoad;
+    }
+
+private:
+    QueryWrapper query; // NOTE(review): presumably owns the PDH query handle, see query_wrapper.h - confirm
+    std::vector<PDH_HCOUNTER> coreTimeCounters; // indexed by core number
+};
+
+#elif __linux__
+#include <chrono>
+#include <regex>
+#include <utility>
+#include <fstream>
+#include <unistd.h>
+
+namespace {
+const long clockTicks = sysconf(_SC_CLK_TCK); // jiffies per second, used to convert /proc/stat values
+
+const std::size_t nCores = sysconf(_SC_NPROCESSORS_CONF);
+
+// Returns idle + iowait jiffies of every "cpuN" line of /proc/stat, indexed by N; throws if N >= nCores
+std::vector<unsigned long> getIdleCpuStat() {
+    std::vector<unsigned long> idleCpuStat(nCores);
+    std::ifstream procStat("/proc/stat");
+    std::string line;
+    std::smatch match;
+    // compiled only once: the pattern never changes and this function runs on every sample
+    static const std::regex coreJiffies("^cpu(\\d+)\\s+"
+        "(\\d+)\\s+(\\d+)\\s+(\\d+)\\s+" // user, nice, system
+        "(\\d+)\\s+" // idle
+        "(\\d+)"); // iowait
+
+    while (std::getline(procStat, line)) {
+        if (std::regex_search(line, match, coreJiffies)) {
+            // it doesn't handle overflow of sum and overflows of /proc/stat values
+            unsigned long idleInfo = stoul(match[5]) + stoul(match[6]),
+                coreId = stoul(match[1]);
+            if (nCores <= coreId) {
+                throw std::runtime_error("The number of cores has changed");
+            }
+            idleCpuStat[coreId] = idleInfo;
+        }
+    }
+    return idleCpuStat;
+}
+}
+
+class CpuMonitor::PerformanceCounter {
+public:
+    PerformanceCounter() : prevIdleCpuStat{getIdleCpuStat()}, prevTimePoint{std::chrono::steady_clock::now()} {}
+
+    // Per-core load (1 - idle share) since the previous successful sample; empty if called too soon after it
+    std::vector<double> getCpuLoad() {
+        std::vector<unsigned long> idleCpuStat = getIdleCpuStat();
+        auto timePoint = std::chrono::steady_clock::now();
+        // don't update data too frequently which may result in negative values for cpuLoad.
+        // It may happen when collectData() is called just after setHistorySize().
+        if (timePoint - prevTimePoint <= std::chrono::milliseconds{100}) return {};
+        const double elapsedSec = std::chrono::duration<double>(timePoint - prevTimePoint).count();
+        std::vector<double> cpuLoad(nCores);
+        for (std::size_t i = 0; i < idleCpuStat.size(); ++i) {
+            cpuLoad[i] = 1.0 - static_cast<double>(idleCpuStat[i] - prevIdleCpuStat[i]) / clockTicks / elapsedSec;
+        }
+        // move the baseline forward, otherwise every result is the average since construction
+        prevIdleCpuStat = std::move(idleCpuStat);
+        prevTimePoint = timePoint;
+        return cpuLoad;
+    }
+private:
+    std::vector<unsigned long> prevIdleCpuStat;
+    std::chrono::steady_clock::time_point prevTimePoint;
+};
+
+#else
+// not implemented
+namespace {
+const std::size_t nCores{0}; // no cores are reported, so CpuMonitor's per-core sums stay empty
+}
+
+class CpuMonitor::PerformanceCounter {
+public:
+    std::vector<double> getCpuLoad() {return {};}; // always empty, so collectData() records nothing
+};
+#endif
+
+CpuMonitor::CpuMonitor() :
+    samplesNumber{0},
+    historySize{0}, // sampling is off: no PerformanceCounter exists until setHistorySize() gets a non-zero size
+    cpuLoadSum(nCores, 0) {} // one accumulator per core
+
+// PerformanceCounter is an incomplete type in the header, so the destructor has to be defined here, where it is complete
+CpuMonitor::~CpuMonitor() = default;
+
+void CpuMonitor::setHistorySize(std::size_t size) {
+    // a switch from zero to non-zero creates the sampler, a switch back to zero destroys it
+    if (0 == historySize && 0 != size) {
+        performanceCounter.reset(new PerformanceCounter);
+    } else if (0 != historySize && 0 == size) {
+        performanceCounter.reset();
+    }
+    historySize = size;
+    while (cpuLoadHistory.size() > size) cpuLoadHistory.pop_front(); // drop the oldest samples first
+}
+
+void CpuMonitor::collectData() {
+    // an empty result carries no sample (e.g. the Linux counter was polled too soon): record nothing
+    std::vector<double> sample = performanceCounter->getCpuLoad();
+    if (sample.empty()) return;
+
+    for (std::size_t core = 0; core < sample.size(); ++core) {
+        cpuLoadSum[core] += sample[core];
+    }
+    ++samplesNumber;
+
+    cpuLoadHistory.push_back(std::move(sample));
+    if (cpuLoadHistory.size() > historySize) {
+        cpuLoadHistory.pop_front();
+    }
+}
+
+std::size_t CpuMonitor::getHistorySize() const { // the size most recently passed to setHistorySize()
+    return historySize;
+}
+
+std::deque<std::vector<double>> CpuMonitor::getLastHistory() const { // copy of the stored samples, oldest first
+    return cpuLoadHistory;
+}
+
+std::vector<double> CpuMonitor::getMeanCpuLoad() const {
+    // NOTE: before the first sample is collected this computes 0.0 / 0, i.e. NaN for every core
+    std::vector<double> meanCpuLoad(cpuLoadSum);
+    for (double& coreLoad : meanCpuLoad) {
+        coreLoad /= samplesNumber;
+    }
+    return meanCpuLoad;
+}
diff --git a/demos/common/monitors/cpu_monitor.h b/demos/common/monitors/cpu_monitor.h
new file mode 100644
index 00000000000..38d284538e4
--- /dev/null
+++ b/demos/common/monitors/cpu_monitor.h
@@ -0,0 +1,28 @@
+// Copyright (C) 2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#pragma once
+
+#include <deque>
+#include <memory>
+#include <vector>
+
+class CpuMonitor {
+public:
+    CpuMonitor();
+    ~CpuMonitor();
+    void setHistorySize(std::size_t size); // 0 turns sampling off, a non-zero size turns it on
+    std::size_t getHistorySize() const;
+    void collectData(); // takes one sample; call it only while the history size is non-zero
+    std::deque<std::vector<double>> getLastHistory() const; // oldest sample first, one value per core
+    std::vector<double> getMeanCpuLoad() const; // per-core mean over all samples collected so far
+
+private:
+    unsigned samplesNumber;
+    std::size_t historySize; // same type as the setter and getter use, so that a size is never truncated
+    std::vector<double> cpuLoadSum;
+    std::deque<std::vector<double>> cpuLoadHistory;
+    class PerformanceCounter; // platform specific sampler, defined in cpu_monitor.cpp
+    std::unique_ptr<PerformanceCounter> performanceCounter;
+};
diff --git a/demos/common/monitors/memory_monitor.cpp b/demos/common/monitors/memory_monitor.cpp
new file mode 100644
index 00000000000..74019b46d37
--- /dev/null
+++ b/demos/common/monitors/memory_monitor.cpp
@@ -0,0 +1,208 @@
+// Copyright (C) 2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#include "memory_monitor.h"
+
+struct MemState {
+    double memTotal, usedMem, usedSwap; // all in GiB
+};
+
+#ifdef _WIN32
+#include "query_wrapper.h"
+#include <algorithm>
+#define PSAPI_VERSION 2
+#include <system_error>
+#include <windows.h>
+#include <pdhmsg.h>
+#include <psapi.h>
+
+namespace {
+double getMemTotal() { // physical memory size in GiB; throws std::runtime_error if the query fails
+    PERFORMANCE_INFORMATION performanceInformation;
+    if (!GetPerformanceInfo(&performanceInformation, sizeof(performanceInformation))) {
+        throw std::runtime_error("GetPerformanceInfo() failed");
+    }
+    // NOTE(review): the product is computed in the fields' integer type before the cast - confirm it can't overflow
+    return static_cast<double>(performanceInformation.PhysicalTotal * performanceInformation.PageSize)
+        / (1024 * 1024 * 1024);
+}
+}
+
+class MemoryMonitor::PerformanceCounter { // Windows backend: GetPerformanceInfo() plus a PDH paging file usage counter
+public:
+    PerformanceCounter() { // throws std::system_error if the counter can't be added or scaled
+        PDH_STATUS status = PdhAddCounterW(query, L"\\Paging File(_Total)\\% Usage", 0, &pagingFileUsageCounter);
+        if (ERROR_SUCCESS != status) {
+            throw std::system_error(status, std::system_category(), "PdhAddCounterW() failed");
+        }
+        status = PdhSetCounterScaleFactor(pagingFileUsageCounter, -2); // scale counter to [0, 1]
+        if (ERROR_SUCCESS != status) {
+            throw std::system_error(status, std::system_category(), "PdhSetCounterScaleFactor() failed");
+        }
+    }
+
+    MemState getMemState() { // returns {total, used memory, used swap} in GiB; throws if any query fails
+        PERFORMANCE_INFORMATION performanceInformation;
+        if (!GetPerformanceInfo(&performanceInformation, sizeof(performanceInformation))) {
+            throw std::runtime_error("GetPerformanceInfo() failed");
+        }
+
+        PDH_STATUS status;
+        status = PdhCollectQueryData(query);
+        if (ERROR_SUCCESS != status) {
+            throw std::system_error(status, std::system_category(), "PdhCollectQueryData() failed");
+        }
+        PDH_FMT_COUNTERVALUE displayValue;
+        status = PdhGetFormattedCounterValue(pagingFileUsageCounter, PDH_FMT_DOUBLE, NULL, &displayValue);
+        if (ERROR_SUCCESS != status) {
+            throw std::system_error(status, std::system_category(), "PdhGetFormattedCounterValue() failed");
+        }
+        if (PDH_CSTATUS_VALID_DATA != displayValue.CStatus && PDH_CSTATUS_NEW_DATA != displayValue.CStatus) {
+            throw std::runtime_error("Error in counter data"); // the call succeeded but the value is not usable
+        }
+
+        double pagingFilesSize = static_cast<double>( // commit limit minus physical memory, converted to GiB
+            (performanceInformation.CommitLimit - performanceInformation.PhysicalTotal)
+            * performanceInformation.PageSize) / (1024 * 1024 * 1024);
+        return {static_cast<double>(performanceInformation.PhysicalTotal * performanceInformation.PageSize)
+                / (1024 * 1024 * 1024),
+            static_cast<double>(
+                (performanceInformation.PhysicalTotal - performanceInformation.PhysicalAvailable)
+                * performanceInformation.PageSize) / (1024 * 1024 * 1024),
+            pagingFilesSize * displayValue.doubleValue}; // used swap = paging files size * usage fraction
+    }
+private:
+    QueryWrapper query; // NOTE(review): presumably owns the PDH query handle, see query_wrapper.h - confirm
+    PDH_HCOUNTER pagingFileUsageCounter;
+};
+
+#elif __linux__
+#include <fstream>
+#include <utility>
+#include <vector>
+#include <regex>
+
+namespace {
+std::pair<std::pair<double, double>, std::pair<double, double>> getAvailableMemSwapTotalMemSwap() {
+    double memAvailable = 0, swapFree = 0, memTotal = 0, swapTotal = 0; // GiB, filled from /proc/meminfo
+    static const std::regex memRegex("^(.+):\\s+(\\d+) kB$"); // compiled once instead of on every sample
+    std::string line;
+    std::smatch match;
+    std::ifstream meminfo("/proc/meminfo");
+    while (std::getline(meminfo, line)) {
+        if (std::regex_match(line, match, memRegex)) {
+            if ("MemAvailable" == match[1]) {
+                memAvailable = stod(match[2]) / (1024 * 1024); // kB -> GiB
+            } else if ("SwapFree" == match[1]) {
+                swapFree = stod(match[2]) / (1024 * 1024);
+            } else if ("MemTotal" == match[1]) {
+                memTotal = stod(match[2]) / (1024 * 1024);
+            } else if ("SwapTotal" == match[1]) {
+                swapTotal = stod(match[2]) / (1024 * 1024);
+            }
+        }
+    }
+    if (0 == memTotal) { // also the case when /proc/meminfo could not be read at all
+        throw std::runtime_error("Can't get MemTotal");
+    }
+    return {{memAvailable, swapFree}, {memTotal, swapTotal}};
+}
+
+double getMemTotal() { // MemTotal in GiB
+    return getAvailableMemSwapTotalMemSwap().second.first;
+}
+}
+
+class MemoryMonitor::PerformanceCounter {
+public:
+    // Linux backend: used memory = MemTotal - MemAvailable, used swap = SwapTotal - SwapFree
+    MemState getMemState() {
+        const auto availableAndTotal = getAvailableMemSwapTotalMemSwap();
+        const std::pair<double, double>& available = availableAndTotal.first; // {MemAvailable, SwapFree}
+        const std::pair<double, double>& total = availableAndTotal.second; // {MemTotal, SwapTotal}
+        return {total.first, total.first - available.first, total.second - available.second};
+    }
+};
+
+#else
+// not implemented
+namespace {
+double getMemTotal() {return 0.0;} // memory size is not available on this platform
+}
+
+class MemoryMonitor::PerformanceCounter {
+public:
+    MemState getMemState() {return {0.0, 0.0, 0.0};} // every sample reports zero total, used memory and used swap
+};
+#endif
+
+MemoryMonitor::MemoryMonitor() :
+    samplesNumber{0},
+    historySize{0}, // sampling is off: no PerformanceCounter exists until setHistorySize() gets a non-zero size
+    memSum{0.0},
+    swapSum{0.0},
+    maxMem{0.0},
+    maxSwap{0.0},
+    memTotal{::getMemTotal()}, // "::" selects the file-local free function, not the member of the same name
+    maxMemTotal{memTotal} {} // memTotal is declared before maxMemTotal, so it is already initialized here
+
+// PerformanceCounter is an incomplete type in the header, so the destructor has to be defined here, where it is complete
+MemoryMonitor::~MemoryMonitor() = default;
+
+void MemoryMonitor::setHistorySize(std::size_t size) {
+    // a switch from zero to non-zero creates the sampler, a switch back to zero destroys it
+    if (0 == historySize && 0 != size) {
+        performanceCounter.reset(new MemoryMonitor::PerformanceCounter);
+    } else if (0 != historySize && 0 == size) {
+        performanceCounter.reset();
+    }
+    historySize = size;
+    while (memSwapUsageHistory.size() > size) memSwapUsageHistory.pop_front(); // drop the oldest samples first
+}
+
+void MemoryMonitor::collectData() {
+    const MemState sample = performanceCounter->getMemState();
+    ++samplesNumber;
+    // the running sums feed the means, the running maxima are reported as they are
+    memSum += sample.usedMem;
+    swapSum += sample.usedSwap;
+    maxMem = std::max(maxMem, sample.usedMem);
+    maxSwap = std::max(maxSwap, sample.usedSwap);
+    maxMemTotal = std::max(maxMemTotal, sample.memTotal);
+    memSwapUsageHistory.emplace_back(sample.usedMem, sample.usedSwap);
+    if (memSwapUsageHistory.size() > historySize) {
+        memSwapUsageHistory.pop_front();
+    }
+}
+
+std::size_t MemoryMonitor::getHistorySize() const { // the size most recently passed to setHistorySize()
+    return historySize;
+}
+
+std::deque<std::pair<double, double>> MemoryMonitor::getLastHistory() const { // {usedMem, usedSwap} pairs, oldest first
+    return memSwapUsageHistory;
+}
+
+double MemoryMonitor::getMeanMem() const { // NOTE: 0.0 / 0, i.e. NaN, before the first sample is collected
+    return memSum / samplesNumber;
+}
+
+double MemoryMonitor::getMeanSwap() const { // NOTE: 0.0 / 0, i.e. NaN, before the first sample is collected
+    return swapSum / samplesNumber;
+}
+
+double MemoryMonitor::getMaxMem() const { // largest used memory value among the collected samples
+    return maxMem;
+}
+
+double MemoryMonitor::getMaxSwap() const { // largest used swap value among the collected samples
+    return maxSwap;
+}
+
+double MemoryMonitor::getMemTotal() const { // total memory as measured when the monitor was constructed
+    return memTotal;
+}
+
+double MemoryMonitor::getMaxMemTotal() const { // largest total seen at construction or in any sample
+    return maxMemTotal;
+}
diff --git a/demos/common/monitors/memory_monitor.h b/demos/common/monitors/memory_monitor.h
new file mode 100644
index 00000000000..9eda10f7559
--- /dev/null
+++ b/demos/common/monitors/memory_monitor.h
@@ -0,0 +1,34 @@
+// Copyright (C) 2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#pragma once
+
+#include <deque>
+#include <memory>
+
+class MemoryMonitor {
+public:
+    MemoryMonitor();
+    ~MemoryMonitor();
+    void setHistorySize(std::size_t size); // 0 turns sampling off, a non-zero size turns it on
+    std::size_t getHistorySize() const;
+    void collectData(); // takes one sample; call it only while the history size is non-zero
+    std::deque<std::pair<double, double>> getLastHistory() const; // {used memory, used swap} pairs, oldest first
+    double getMeanMem() const; // in GiB
+    double getMeanSwap() const; // in GiB
+    double getMaxMem() const; // in GiB
+    double getMaxSwap() const; // in GiB
+    double getMemTotal() const; // in GiB, measured once at construction
+    double getMaxMemTotal() const; // a system may have hotpluggable memory
+private:
+    unsigned samplesNumber;
+    std::size_t historySize;
+    double memSum, swapSum; // sums over all samples, the means are derived from them
+    double maxMem, maxSwap;
+    double memTotal; // must stay declared before maxMemTotal, which is initialized from it
+    double maxMemTotal;
+    std::deque<std::pair<double, double>> memSwapUsageHistory;
+    class PerformanceCounter; // platform specific sampler, defined in memory_monitor.cpp
+    std::unique_ptr<PerformanceCounter> performanceCounter;
+};
diff --git a/demos/common/monitors/presenter.cpp b/demos/common/monitors/presenter.cpp
new file mode 100644
index 00000000000..0cadc9d5279
--- /dev/null
+++ b/demos/common/monitors/presenter.cpp
@@ -0,0 +1,301 @@
+// Copyright (C) 2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#include <cctype>
+#include <iomanip>
+#include <numeric>
+
+#include "presenter.h"
+
+namespace {
+const std::map<int, MonitorType> keyToMonitorType{ // upper case key -> monitor it toggles
+    {'C', MonitorType::CpuAverage},
+    {'D', MonitorType::DistributionCpu},
+    {'M', MonitorType::Memory}};
+
+// Maps every character of `keys` (case-insensitively) to its monitor; throws on an unknown character
+std::set<MonitorType> strKeysToMonitorSet(const std::string& keys) {
+    std::set<MonitorType> enabledMonitors;
+    for (unsigned char key: keys) {
+        const auto found = keyToMonitorType.find(std::toupper(key));
+        if (keyToMonitorType.end() == found) {
+            throw std::runtime_error("Unknown monitor type");
+        }
+        enabledMonitors.insert(found->second);
+    }
+    return enabledMonitors;
+}
+}
+
+Presenter::Presenter(std::set<MonitorType> enabledMonitors,
+        int yPos,
+        cv::Size graphSize,
+        std::size_t historySize) :
+            yPos{yPos},
+            graphSize{graphSize},
+            graphPadding{std::max(1, static_cast<int>(graphSize.width * 0.05))}, // 5% of the graph width, at least 1
+            historySize{historySize},
+            distributionCpuEnabled{false},
+            strStream{std::ios_base::app} { // app: operator<< appends after the text set with str()
+    for (MonitorType monitor : enabledMonitors) { // addRemoveMonitor() toggles, so each listed monitor is toggled once
+        addRemoveMonitor(monitor);
+    }
+}
+
+Presenter::Presenter(const std::string& keys, int yPos, cv::Size graphSize, std::size_t historySize) :
+    Presenter{strKeysToMonitorSet(keys), yPos, graphSize, historySize} {} // throws if `keys` has an unknown character
+
+void Presenter::addRemoveMonitor(MonitorType monitor) { // toggles `monitor`: enables it if it is off, disables it if it is on
+    unsigned updatedHistorySize = 1;
+    if (historySize > 1) {
+        int sampleStep = std::max(1, static_cast<int>(graphSize.width / (historySize - 1)));
+        // +1 because plotting graphSize.width/sampleStep segments takes one more point than there are segments;
+        // the division is rounded up to get an extra point when the segments don't reach the graph edge
+        updatedHistorySize = (graphSize.width + sampleStep - 1) / sampleStep + 1;
+    }
+    switch(monitor) {
+        case MonitorType::CpuAverage: { // a cpuMonitor history longer than 1 means the average graph is on
+            if (cpuMonitor.getHistorySize() > 1 && distributionCpuEnabled) {
+                cpuMonitor.setHistorySize(1); // keep a single sample, DistributionCpu still needs the latest one
+            } else if (cpuMonitor.getHistorySize() > 1 && !distributionCpuEnabled) {
+                cpuMonitor.setHistorySize(0); // nobody uses cpuMonitor any more
+            } else { // cpuMonitor.getHistorySize() <= 1
+                cpuMonitor.setHistorySize(updatedHistorySize);
+            }
+            break;
+        }
+        case MonitorType::DistributionCpu: {
+            if (distributionCpuEnabled) {
+                distributionCpuEnabled = false;
+                if (1 == cpuMonitor.getHistorySize()) { // cpuMonitor was used only for DistributionCpu => disable it
+                    cpuMonitor.setHistorySize(0);
+                }
+            } else {
+                distributionCpuEnabled = true;
+                cpuMonitor.setHistorySize(std::max(std::size_t{1}, cpuMonitor.getHistorySize())); // keep a longer history
+            }
+            break;
+        }
+        case MonitorType::Memory: { // a memoryMonitor history longer than 1 means the memory graph is on
+            if (memoryMonitor.getHistorySize() > 1) {
+                memoryMonitor.setHistorySize(0);
+            } else {
+                memoryMonitor.setHistorySize(updatedHistorySize);
+            }
+            break;
+        }
+    }
+}
+
+// Reacts to a pressed key: 'H' shows or hides all monitors, a monitor key toggles that monitor (case-insensitive)
+void Presenter::handleKey(int key) {
+    // std::toupper() is defined only for unsigned char values and EOF: leave any other key code as it is
+    if (0 <= key && key <= 0xFF) key = std::toupper(key);
+    if ('H' != key) { // unknown keys are ignored
+        auto iter = keyToMonitorType.find(key);
+        if (keyToMonitorType.end() != iter) addRemoveMonitor(iter->second);
+        return;
+    }
+    if (0 == cpuMonitor.getHistorySize() && memoryMonitor.getHistorySize() <= 1) { // nothing is shown: show all
+        addRemoveMonitor(MonitorType::CpuAverage);
+        addRemoveMonitor(MonitorType::DistributionCpu);
+        addRemoveMonitor(MonitorType::Memory);
+    } else { // something is shown: hide everything
+        cpuMonitor.setHistorySize(0);
+        distributionCpuEnabled = false;
+        memoryMonitor.setHistorySize(0);
+    }
+}
+
+void Presenter::drawGraphs(cv::Mat& frame) {
+    const std::chrono::steady_clock::time_point curTimeStamp = std::chrono::steady_clock::now();
+    if (curTimeStamp - prevTimeStamp >= std::chrono::milliseconds{1000}) {
+        prevTimeStamp = curTimeStamp;
+        if (0 != cpuMonitor.getHistorySize()) {
+            cpuMonitor.collectData();
+        }
+        if (memoryMonitor.getHistorySize() > 1) {
+            memoryMonitor.collectData();
+        }
+    }
+
+    int numberOfEnabledMonitors = (cpuMonitor.getHistorySize() > 1) + distributionCpuEnabled
+        + (memoryMonitor.getHistorySize() > 1);
+    int panelWidth = graphSize.width * numberOfEnabledMonitors
+        + std::max(0, numberOfEnabledMonitors - 1) * graphPadding;
+    while (panelWidth > frame.cols) {
+        panelWidth = std::max(0, panelWidth - graphSize.width - graphPadding);
+        --numberOfEnabledMonitors; // can't draw all monitors
+    }
+    int graphPos = std::max(0, (frame.cols - 1 - panelWidth) / 2);
+    int textGraphSplittingLine = graphSize.height / 5;
+    int graphRectHeight = graphSize.height - textGraphSplittingLine;
+    int sampleStep = 1;
+    unsigned possibleHistorySize = 1;
+    if (historySize > 1) {
+        sampleStep = std::max(1, static_cast<int>(graphSize.width / (historySize - 1)));
+        possibleHistorySize = (graphSize.width + sampleStep - 1) / sampleStep + 1;
+    }
+
+    if (cpuMonitor.getHistorySize() > 1 && possibleHistorySize > 1 && --numberOfEnabledMonitors >= 0) {
+        std::deque<std::vector<double>> lastHistory = cpuMonitor.getLastHistory();
+        cv::Mat graph = frame(cv::Rect{cv::Point{graphPos, yPos}, graphSize} & cv::Rect(0, 0, frame.cols, frame.rows));
+        graph = graph / 2 + cv::Scalar{127, 127, 127};
+
+        int lineXPos = graph.cols - 1;
+        std::vector<cv::Point> averageLoad(lastHistory.size());
+
+        for (int i = lastHistory.size() - 1; i >= 0; --i) {
+            double mean = std::accumulate(lastHistory[i].begin(), lastHistory[i].end(), 0.0) / lastHistory[i].size();
+            averageLoad[i] = {lineXPos, graphSize.height - static_cast<int>(mean * graphRectHeight)};
+            lineXPos -= sampleStep;
+        }
+
+        cv::polylines(graph, averageLoad, false, {255, 0, 0}, 2);
+        cv::rectangle(frame, cv::Rect{
+                cv::Point{graphPos, yPos + textGraphSplittingLine},
+                cv::Size{graphSize.width, graphSize.height - textGraphSplittingLine}
+            }, {0, 0, 0});
+        strStream.str("CPU");
+        if (!lastHistory.empty()) {
+            strStream << ": " << std::fixed << std::setprecision(1)
+                << std::accumulate(lastHistory.back().begin(), lastHistory.back().end(), 0.0)
+                    / lastHistory.back().size() * 100 << '%';
+        }
+        int baseline;
+        int textWidth = cv::getTextSize(strStream.str(),
+            cv::FONT_HERSHEY_SIMPLEX,
+            textGraphSplittingLine * 0.04,
+            1,
+            &baseline).width;
+        cv::putText(graph,
+            strStream.str(),
+            cv::Point{(graphSize.width - textWidth) / 2, textGraphSplittingLine - 1},
+            cv::FONT_HERSHEY_SIMPLEX,
+            textGraphSplittingLine * 0.04,
+            {70, 0, 0},
+            1);
+        graphPos += graphSize.width + graphPadding;
+    }
+
+    if (distributionCpuEnabled && --numberOfEnabledMonitors >= 0) {
+        std::deque<std::vector<double>> lastHistory = cpuMonitor.getLastHistory();
+        cv::Mat graph = frame(cv::Rect{cv::Point{graphPos, yPos}, graphSize} & cv::Rect(0, 0, frame.cols, frame.rows));
+        graph = graph / 2 + cv::Scalar{127, 127, 127};
+
+        if (!lastHistory.empty()) {
+            int rectXPos = 0;
+            int step = (graph.cols + lastHistory.back().size() - 1) / lastHistory.back().size(); // round up
+            double sum = 0;
+            for (double coreLoad : lastHistory.back()) {
+                sum += coreLoad;
+                int height = static_cast<int>(graphRectHeight * coreLoad);
+                cv::Rect pillar{cv::Point{rectXPos, graph.rows - height}, cv::Size{step, height}};
+                cv::rectangle(graph, pillar, {255, 0, 0}, cv::FILLED);
+                cv::rectangle(graph, pillar, {0, 0, 0});
+                rectXPos += step;
+            }
+            sum /= lastHistory.back().size();
+            int yLine = graph.rows - static_cast<int>(graphRectHeight * sum);
+            cv::line(graph, cv::Point{0, yLine}, cv::Point{graph.cols, yLine}, {0, 255, 0}, 2);
+        }
+        cv::Rect border{cv::Point{graphPos, yPos + textGraphSplittingLine},
+            cv::Size{graphSize.width, graphSize.height - textGraphSplittingLine}};
+        cv::rectangle(frame, border, {0, 0, 0});
+        strStream.str("Core load");
+        if (!lastHistory.empty()) {
+            strStream << ": " << std::fixed << std::setprecision(1)
+                << std::accumulate(lastHistory.back().begin(), lastHistory.back().end(), 0.0)
+                    / lastHistory.back().size() * 100 << '%';
+        }
+        int baseline;
+        int textWidth = cv::getTextSize(strStream.str(),
+            cv::FONT_HERSHEY_SIMPLEX,
+            textGraphSplittingLine * 0.04,
+            1,
+            &baseline).width;
+        cv::putText(graph,
+            strStream.str(),
+            cv::Point{(graphSize.width - textWidth) / 2, textGraphSplittingLine - 1},
+            cv::FONT_HERSHEY_SIMPLEX,
+            textGraphSplittingLine * 0.04,
+            {0, 70, 0});
+        graphPos += graphSize.width + graphPadding;
+    }
+
+    if (memoryMonitor.getHistorySize() > 1 && possibleHistorySize > 1 && --numberOfEnabledMonitors >= 0) {
+        std::deque<std::pair<double, double>> lastHistory = memoryMonitor.getLastHistory();
+        cv::Mat graph = frame(cv::Rect{cv::Point{graphPos, yPos}, graphSize} & cv::Rect(0, 0, frame.cols, frame.rows));
+        graph = graph / 2 + cv::Scalar{127, 127, 127};
+        int histxPos = graph.cols - 1;
+        double range = std::min(memoryMonitor.getMaxMemTotal() + memoryMonitor.getMaxSwap(),
+            (memoryMonitor.getMaxMem() + memoryMonitor.getMaxSwap()) * 1.2);
+        if (lastHistory.size() > 1) {
+            for (auto memUsageIt = lastHistory.rbegin(); memUsageIt != lastHistory.rend() - 1; ++memUsageIt) {
+                constexpr double SWAP_THRESHOLD = 10.0 / 1024; // 10 MiB
+                cv::Vec3b color =
+                    (memoryMonitor.getMemTotal() * 0.95 > memUsageIt->first) || (memUsageIt->second < SWAP_THRESHOLD) ?
+                        cv::Vec3b{0, 255, 255} :
+                        cv::Vec3b{0, 0, 255};
+                cv::Point right{histxPos,
+                    graph.rows - static_cast<int>(graphRectHeight * (memUsageIt->first + memUsageIt->second) / range)};
+                cv::Point left{histxPos - sampleStep,
+                    graph.rows - static_cast<int>(
+                        graphRectHeight * ((memUsageIt + 1)->first + (memUsageIt + 1)->second) / range)};
+                cv::line(graph, right, left, color, 2);
+                histxPos -= sampleStep;
+            }
+        }
+
+        cv::Rect border{cv::Point{graphPos, yPos + textGraphSplittingLine},
+            cv::Size{graphSize.width, graphSize.height - textGraphSplittingLine}};
+        cv::rectangle(frame, {border}, {0, 0, 0});
+        if (lastHistory.empty()) {
+            strStream.str("Memory");
+        } else {
+            strStream.str("");
+            strStream << std::fixed << std::setprecision(1) << lastHistory.back().first << " + "
+                << lastHistory.back().second << " GiB";
+        }
+        int baseline;
+        int textWidth = cv::getTextSize(strStream.str(),
+            cv::FONT_HERSHEY_SIMPLEX,
+            textGraphSplittingLine * 0.04,
+            1,
+            &baseline).width;
+        cv::putText(graph,
+            strStream.str(),
+            cv::Point{(graphSize.width - textWidth) / 2, textGraphSplittingLine - 1},
+            cv::FONT_HERSHEY_SIMPLEX,
+            textGraphSplittingLine * 0.04,
+            {0, 35, 35});
+    }
+}
+
+std::string Presenter::reportMeans() const { // builds a text summary of the mean CPU and memory usage, one line per metric
+    std::ostringstream collectedDataStream;
+    collectedDataStream << std::fixed << std::setprecision(1); // print every number with one digit after the decimal point
+    if (cpuMonitor.getHistorySize() > 1) {
+        collectedDataStream << "Mean core utilization: ";
+        for (double mean : cpuMonitor.getMeanCpuLoad()) { // presumably one mean per core -- confirm in CpuMonitor
+            collectedDataStream << mean * 100 << "% "; // scaled by 100 to print as a percentage
+        }
+        collectedDataStream << '\n';
+    }
+    if (distributionCpuEnabled) {
+        std::vector<double> meanCpuLoad = cpuMonitor.getMeanCpuLoad();
+        double mean = std::accumulate(meanCpuLoad.begin(), meanCpuLoad.end(), 0.0) / meanCpuLoad.size(); // NOTE(review): 0.0 / 0 (NaN) if the vector is empty
+        collectedDataStream << "Mean CPU utilization: " << mean * 100 << "%\n";
+    }
+    if (memoryMonitor.getHistorySize() > 1) {
+        collectedDataStream << "Memory mean usage: " << memoryMonitor.getMeanMem() << " GiB\n";
+        collectedDataStream << "Mean swap usage: " << memoryMonitor.getMeanSwap() << " GiB\n";
+    }
+    std::string collectedData = collectedDataStream.str();
+    // drop last \n because usually it is not expected that printing an object starts a new line
+    if (!collectedData.empty()) {
+        return collectedData.substr(0, collectedData.size() - 1);
+    }
+    return collectedData; // empty: none of the sections above was written
+}
diff --git a/demos/common/monitors/presenter.h b/demos/common/monitors/presenter.h
new file mode 100644
index 00000000000..bb1c9566f98
--- /dev/null
+++ b/demos/common/monitors/presenter.h
@@ -0,0 +1,43 @@
+// Copyright (C) 2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#pragma once
+
+#include <map>
+#include <ostream>
+#include <set>
+
+#include <opencv2/imgproc.hpp>
+
+#include "cpu_monitor.h"
+#include "memory_monitor.h"
+
+enum class MonitorType{CpuAverage, DistributionCpu, Memory}; // monitor kinds accepted by Presenter's constructor and addRemoveMonitor()
+
+class Presenter { // draws resource usage graphs onto frames and reports mean usage as text
+public:
+    explicit Presenter(std::set<MonitorType> enabledMonitors = {}, // presumably the monitors that start enabled -- confirm in presenter.cpp
+        int yPos = 20,
+        cv::Size graphSize = {150, 60},
+        std::size_t historySize = 20);
+    explicit Presenter(const std::string& keys, // presumably the same key characters handleKey() accepts -- confirm in presenter.cpp
+        int yPos = 20,
+        cv::Size graphSize = {150, 60},
+        std::size_t historySize = 20);
+    void addRemoveMonitor(MonitorType monitor); // NOTE(review): name suggests it toggles the given monitor -- confirm
+    void handleKey(int key); // handles c, d, m, h keys
+    void drawGraphs(cv::Mat& frame);
+    std::string reportMeans() const; // text summary of mean CPU/memory usage without a trailing newline
+
+    const int yPos; // y coordinate of the top edge of every graph
+    const cv::Size graphSize; // size of a single graph
+    const int graphPadding; // horizontal gap between neighbouring graphs
+private:
+    std::chrono::steady_clock::time_point prevTimeStamp; // NOTE(review): <chrono>, <string> and <sstream> are not included by this header directly -- presumably pulled in by the monitor headers, confirm
+    std::size_t historySize;
+    CpuMonitor cpuMonitor;
+    bool distributionCpuEnabled; // when set, the per-core "Core load" graph is drawn and the mean CPU utilization is reported
+    MemoryMonitor memoryMonitor;
+    std::ostringstream strStream; // scratch stream reused to build each graph's caption
+};
diff --git a/demos/common/monitors/query_wrapper.cpp b/demos/common/monitors/query_wrapper.cpp
new file mode 100644
index 00000000000..184a0e65ac4
--- /dev/null
+++ b/demos/common/monitors/query_wrapper.cpp
@@ -0,0 +1,22 @@
+// Copyright (C) 2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#include "query_wrapper.h"
+
+#include <windows.h>
+#include <system_error>
+
+QueryWrapper::QueryWrapper() { // opens a PDH query and stores its handle in `query`
+    PDH_STATUS status = PdhOpenQuery(NULL, NULL, &query);
+    if (ERROR_SUCCESS != status) {
+        throw std::system_error(status, std::system_category(), "PdhOpenQuery() failed"); // the PDH status is passed on as the error code
+    }
+}
+QueryWrapper::~QueryWrapper() { // closes the query opened by the constructor
+    PdhCloseQuery(query); // returned status is ignored
+}
+
+QueryWrapper::operator PDH_HQUERY() const { // implicit conversion to the wrapped handle
+    return query;
+}
diff --git a/demos/common/monitors/query_wrapper.h b/demos/common/monitors/query_wrapper.h
new file mode 100644
index 00000000000..ea0e5599e5b
--- /dev/null
+++ b/demos/common/monitors/query_wrapper.h
@@ -0,0 +1,17 @@
+// Copyright (C) 2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#pragma once
+
+#include <pdh.h>
+class QueryWrapper { // owns a PDH query handle: the constructor opens it, the destructor closes it
+public:
+    QueryWrapper();
+    ~QueryWrapper();
+    QueryWrapper(const QueryWrapper&) = delete; // non-copyable; a copy would close the same handle a second time
+    QueryWrapper& operator=(const QueryWrapper&) = delete;
+    operator PDH_HQUERY() const; // lets the wrapper be passed where a PDH_HQUERY is expected
+private:
+    PDH_HQUERY query;
+};
diff --git a/demos/common/samples/args_helper.hpp b/demos/common/samples/args_helper.hpp
index fc193aeeab9..0fe9982533d 100644
--- a/demos/common/samples/args_helper.hpp
+++ b/demos/common/samples/args_helper.hpp
@@ -34,7 +34,7 @@
 inline void readInputFilesArguments(std::vector<std::string> &files, const std::string& arg) {
     struct stat sb;
     if (stat(arg.c_str(), &sb) != 0) {
-        if (arg.find("rtsp:") != 0) {
+        if (arg.compare(0, 5, "rtsp:") != 0) {
             slog::warn << "File " << arg << " cannot be opened!" << slog::endl;
             return;
         }
@@ -103,15 +103,18 @@ inline std::vector<std::string> split(const std::string &s, char delim) {
 }
 
 inline std::vector<std::string> parseDevices(const std::string& device_string) {
-    std::string comma_separated_devices = device_string;
-    const std::string::size_type colon_position = comma_separated_devices.find(":");
+    const std::string::size_type colon_position = device_string.find(":"); // first ':' separates the prefix from the rest
     if (colon_position != std::string::npos) {
-        comma_separated_devices = comma_separated_devices.substr(colon_position + 1);
+        std::string device_type = device_string.substr(0, colon_position);
+        if (device_type == "HETERO" || device_type == "MULTI") { // a device list is only parsed for these two prefixes
+            std::string comma_separated_devices = device_string.substr(colon_position + 1);
+            std::vector<std::string> devices = split(comma_separated_devices, ',');
+            for (auto& device : devices)
+                device = device.substr(0, device.find("(")); // drop everything from the first '(' onwards
+            return devices;
+        }
     }
-    auto devices = split(comma_separated_devices, ',');
-    for (auto& device : devices)
-        device = device.substr(0, device.find("("));
-    return devices;
+    return {device_string}; // any other string is returned unchanged as the only device
 }
 
 inline std::map<std::string, uint32_t> parseValuePerDevice(const std::set<std::string>& devices,
diff --git a/demos/common/samples/classification_results.h b/demos/common/samples/classification_results.h
deleted file mode 100644
index 3cf0a2b06be..00000000000
--- a/demos/common/samples/classification_results.h
+++ /dev/null
@@ -1,92 +0,0 @@
-// Copyright (C) 2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-/**
- * @brief a header file with ouput classification results
- * @file classification_results.hpp
- */
-#include <string>
-#include <vector>
-#include <iostream>
-#include <utility>
-
-#include <ie_blob.h>
-
-/**
- * @class ClassificationResult
- * @brief A ClassificationResult creates an output table with results
- */
-class ClassificationResult {
-private:
-    const std::string _classidStr = "classid";
-    const std::string _probabilityStr = "probability";
-    const std::string _labelStr = "label";
-    size_t _nTop;
-    InferenceEngine::Blob::Ptr _outBlob;
-    const std::vector<std::string> _labels;
-    const std::vector<std::string> _imageNames;
-    const size_t _batchSize;
-
-    void printHeader() {
-        std::cout << _classidStr << " " << _probabilityStr;
-        if (!_labels.empty())
-            std::cout << " " << _labelStr;
-        std::string classidColumn(_classidStr.length(), '-');
-        std::string probabilityColumn(_probabilityStr.length(), '-');
-        std::string labelColumn(_labelStr.length(), '-');
-        std::cout << std::endl << classidColumn << " " << probabilityColumn;
-        if (!_labels.empty())
-            std::cout << " " << labelColumn;
-        std::cout << std::endl;
-    }
-
-public:
-    explicit ClassificationResult(InferenceEngine::Blob::Ptr output_blob,
-                                  std::vector<std::string> image_names = {},
-                                  size_t batch_size = 1,
-                                  size_t num_of_top = 10,
-                                  std::vector<std::string> labels = {}) :
-            _nTop(num_of_top),
-            _outBlob(std::move(output_blob)),
-            _labels(std::move(labels)),
-            _imageNames(std::move(image_names)),
-            _batchSize(batch_size) {
-        if (_imageNames.size() != _batchSize) {
-            throw std::logic_error("Batch size should be equal to the number of images.");
-        }
-    }
-
-    /**
-    * @brief prints formatted classification results
-    */
-    void print() {
-        /** This vector stores id's of top N results **/
-        std::vector<unsigned> results;
-        TopResults(_nTop, *_outBlob, results);
-
-        /** Print the result iterating over each batch **/
-        std::cout << std::endl << "Top " << _nTop << " results:" << std::endl << std::endl;
-        for (unsigned int image_id = 0; image_id < _batchSize; ++image_id) {
-            std::cout << "Image " << _imageNames[image_id] << std::endl << std::endl;
-            printHeader();
-
-            for (size_t id = image_id * _nTop, cnt = 0; id < (image_id + 1) * _nTop; ++cnt, ++id) {
-                std::cout.precision(7);
-                /** Getting probability for resulting class **/
-                const auto result = _outBlob->buffer().
-                        as<InferenceEngine::PrecisionTrait<InferenceEngine::Precision::FP32>::value_type*>()
-                [results[id] + image_id * (_outBlob->size() / _batchSize)];
-
-                std::cout << std::setw(static_cast<int>(_classidStr.length())) << std::left << results[id] << " ";
-                std::cout << std::left << std::setw(static_cast<int>(_probabilityStr.length())) << std::fixed << result;
-
-                if (!_labels.empty()) {
-                    std::cout << " " + _labels[results[id]];
-                }
-                std::cout << std::endl;
-            }
-            std::cout << std::endl;
-        }
-    }
-};
diff --git a/demos/common/samples/common.hpp b/demos/common/samples/common.hpp
index 1b48f329f9c..7a8542a5975 100644
--- a/demos/common/samples/common.hpp
+++ b/demos/common/samples/common.hpp
@@ -48,15 +48,9 @@ class ConsoleErrorListener : public InferenceEngine::IErrorListener {
     }
 };
 
-/**
- * @brief Trims from both ends (in place)
- * @param s - string to trim
- * @return trimmed string
- */
-inline std::string &trim(std::string &s) {
-    s.erase(s.begin(), std::find_if(s.begin(), s.end(), std::not1(std::ptr_fun<int, int>(std::isspace))));
-    s.erase(std::find_if(s.rbegin(), s.rend(), std::not1(std::ptr_fun<int, int>(std::isspace))).base(), s.end());
-    return s;
+template <typename T, std::size_t N>
+constexpr std::size_t arraySize(const T (&)[N]) noexcept { // number of elements of a built-in array, taken from its type
+    return N;
 }
 
 /**
@@ -70,33 +64,6 @@ static UNUSED std::string fileNameNoExt(const std::string &filepath) {
     return filepath.substr(0, pos);
 }
 
-/**
-* @brief Get extension from filename
-* @param filename - name of the file which extension should be extracted
-* @return string with extracted file extension
-*/
-inline std::string fileExt(const std::string& filename) {
-    auto pos = filename.rfind('.');
-    if (pos == std::string::npos) return "";
-    return filename.substr(pos + 1);
-}
-
-static UNUSED std::ostream &operator<<(std::ostream &os, const InferenceEngine::Version *version) {
-    os << "\n\tAPI version ............ ";
-    if (nullptr == version) {
-        os << "UNKNOWN";
-    } else {
-        os << version->apiVersion.major << "." << version->apiVersion.minor;
-        if (nullptr != version->buildNumber) {
-            os << "\n\t" << "Build .................. " << version->buildNumber;
-        }
-        if (nullptr != version->description) {
-            os << "\n\t" << "Description ....... " << version->description;
-        }
-    }
-    return os;
-}
-
 inline std::ostream &operator<<(std::ostream &os, const InferenceEngine::Version &version) {
     os << "\t" << version.description << " version ......... ";
     os << version.apiVersion.major << "." << version.apiVersion.minor;
@@ -116,55 +83,6 @@ inline std::ostream &operator<<(std::ostream &os, const std::map<std::string, In
     return os;
 }
 
-static UNUSED std::vector<std::vector<size_t>> blobToImageOutputArray(InferenceEngine::TBlob<float>::Ptr output,
-                                                                      size_t *pWidth, size_t *pHeight,
-                                                                      size_t *pChannels) {
-    std::vector<std::vector<size_t>> outArray;
-    size_t W = 0, C = 0, H = 0;
-
-    auto outputDims = output->getTensorDesc().getDims();
-    if (outputDims.size() == 3) {
-        C = outputDims.at(0);
-        H = outputDims.at(1);
-        W = outputDims.at(2);
-    } else if (outputDims.size() == 4) {
-        C = outputDims.at(1);
-        H = outputDims.at(2);
-        W = outputDims.at(3);
-    } else if (outputDims.size() == 5) {
-        C = outputDims.at(1);
-        H = outputDims.at(3);
-        W = outputDims.at(4);
-    } else {
-        THROW_IE_EXCEPTION << "Output blob has unsupported layout " << output->getTensorDesc().getLayout();
-    }
-
-    // Get classes
-    const float *outData = output->data();
-    for (unsigned h = 0; h < H; h++) {
-        std::vector<size_t> row;
-        for (unsigned w = 0; w < W; w++) {
-            float max_value = outData[h * W + w];
-            size_t index = 0;
-            for (size_t c = 1; c < C; c++) {
-                size_t dataIndex = c * H * W + h * W + w;
-                if (outData[dataIndex] > max_value) {
-                    index = c;
-                    max_value = outData[dataIndex];
-                }
-            }
-            row.push_back(index);
-        }
-        outArray.push_back(row);
-    }
-
-    if (pWidth != nullptr) *pWidth = W;
-    if (pHeight != nullptr) *pHeight = H;
-    if (pChannels != nullptr) *pChannels = C;
-
-    return outArray;
-}
-
 /**
  * @class Color
  * @brief A Color class stores channels of a given color
@@ -186,385 +104,43 @@ class Color {
           unsigned char g,
           unsigned char b) : _r(r), _g(g), _b(b) {}
 
-    inline unsigned char red() {
+    inline unsigned char red() const { // value of the red channel
         return _r;
     }
 
-    inline unsigned char blue() {
+    inline unsigned char blue() const { // value of the blue channel
         return _b;
     }
 
-    inline unsigned char green() {
+    inline unsigned char green() const { // value of the green channel
         return _g;
     }
 };
 
-// TODO : keep only one version of writeOutputBMP
-
-/**
- * @brief Writes output data to image
- * @param name - image name
- * @param data - output data
- * @param classesNum - the number of classes
- * @return false if error else true
- */
-static UNUSED void writeOutputBmp(std::vector<std::vector<size_t>> data, size_t classesNum, std::ostream &outFile) {
-    unsigned int seed = (unsigned int) time(NULL);
-    // Known colors for training classes from Cityscape dataset
-    static std::vector<Color> colors = {
-        {128, 64,  128},
-        {232, 35,  244},
-        {70,  70,  70},
-        {156, 102, 102},
-        {153, 153, 190},
-        {153, 153, 153},
-        {30,  170, 250},
-        {0,   220, 220},
-        {35,  142, 107},
-        {152, 251, 152},
-        {180, 130, 70},
-        {60,  20,  220},
-        {0,   0,   255},
-        {142, 0,   0},
-        {70,  0,   0},
-        {100, 60,  0},
-        {90,  0,   0},
-        {230, 0,   0},
-        {32,  11,  119},
-        {0,   74,  111},
-        {81,  0,   81}
-    };
-
-    while (classesNum > colors.size()) {
-        static std::mt19937 rng(seed);
-        std::uniform_int_distribution<int> dist(0, 255);
-        Color color(dist(rng), dist(rng), dist(rng));
-        colors.push_back(color);
-    }
-
-    unsigned char file[14] = {
-            'B', 'M',           // magic
-            0, 0, 0, 0,         // size in bytes
-            0, 0,               // app data
-            0, 0,               // app data
-            40 + 14, 0, 0, 0      // start of data offset
-    };
-    unsigned char info[40] = {
-            40, 0, 0, 0,        // info hd size
-            0, 0, 0, 0,         // width
-            0, 0, 0, 0,         // height
-            1, 0,               // number color planes
-            24, 0,              // bits per pixel
-            0, 0, 0, 0,         // compression is none
-            0, 0, 0, 0,         // image bits size
-            0x13, 0x0B, 0, 0,   // horz resolution in pixel / m
-            0x13, 0x0B, 0, 0,   // vert resolution (0x03C3 = 96 dpi, 0x0B13 = 72 dpi)
-            0, 0, 0, 0,         // #colors in palette
-            0, 0, 0, 0,         // #important colors
-    };
-
-    auto height = data.size();
-    auto width = data.at(0).size();
-
-    if (height > (size_t) std::numeric_limits<int32_t>::max || width > (size_t) std::numeric_limits<int32_t>::max) {
-        THROW_IE_EXCEPTION << "File size is too big: " << height << " X " << width;
-    }
-
-    int padSize = static_cast<int>(4 - (width * 3) % 4) % 4;
-    int sizeData = static_cast<int>(width * height * 3 + height * padSize);
-    int sizeAll = sizeData + sizeof(file) + sizeof(info);
-
-    file[2] = (unsigned char) (sizeAll);
-    file[3] = (unsigned char) (sizeAll >> 8);
-    file[4] = (unsigned char) (sizeAll >> 16);
-    file[5] = (unsigned char) (sizeAll >> 24);
-
-    info[4] = (unsigned char) (width);
-    info[5] = (unsigned char) (width >> 8);
-    info[6] = (unsigned char) (width >> 16);
-    info[7] = (unsigned char) (width >> 24);
-
-    int32_t negativeHeight = -(int32_t) height;
-    info[8] = (unsigned char) (negativeHeight);
-    info[9] = (unsigned char) (negativeHeight >> 8);
-    info[10] = (unsigned char) (negativeHeight >> 16);
-    info[11] = (unsigned char) (negativeHeight >> 24);
-
-    info[20] = (unsigned char) (sizeData);
-    info[21] = (unsigned char) (sizeData >> 8);
-    info[22] = (unsigned char) (sizeData >> 16);
-    info[23] = (unsigned char) (sizeData >> 24);
-
-    outFile.write(reinterpret_cast<char *>(file), sizeof(file));
-    outFile.write(reinterpret_cast<char *>(info), sizeof(info));
-
-    unsigned char pad[3] = {0, 0, 0};
-
-    for (size_t y = 0; y < height; y++) {
-        for (size_t x = 0; x < width; x++) {
-            unsigned char pixel[3];
-            size_t index = data.at(y).at(x);
-            pixel[0] = colors.at(index).red();
-            pixel[1] = colors.at(index).green();
-            pixel[2] = colors.at(index).blue();
-            outFile.write(reinterpret_cast<char *>(pixel), 3);
-        }
-        outFile.write(reinterpret_cast<char *>(pad), padSize);
-    }
-}
-
-/**
-* @brief Writes output data to BMP image
-* @param name - image name
-* @param data - output data
-* @param height - height of the target image
-* @param width - width of the target image
-* @return false if error else true
-*/
-static UNUSED bool writeOutputBmp(std::string name, unsigned char *data, size_t height, size_t width) {
-    std::ofstream outFile;
-    outFile.open(name, std::ofstream::binary);
-    if (!outFile.is_open()) {
-        return false;
-    }
-
-    unsigned char file[14] = {
-        'B', 'M',           // magic
-        0, 0, 0, 0,         // size in bytes
-        0, 0,               // app data
-        0, 0,               // app data
-        40 + 14, 0, 0, 0      // start of data offset
-    };
-    unsigned char info[40] = {
-        40, 0, 0, 0,        // info hd size
-        0, 0, 0, 0,         // width
-        0, 0, 0, 0,         // height
-        1, 0,               // number color planes
-        24, 0,              // bits per pixel
-        0, 0, 0, 0,         // compression is none
-        0, 0, 0, 0,         // image bits size
-        0x13, 0x0B, 0, 0,   // horz resolution in pixel / m
-        0x13, 0x0B, 0, 0,   // vert resolution (0x03C3 = 96 dpi, 0x0B13 = 72 dpi)
-        0, 0, 0, 0,         // #colors in palette
-        0, 0, 0, 0,         // #important colors
-    };
-
-    if (height > (size_t)std::numeric_limits<int32_t>::max || width > (size_t)std::numeric_limits<int32_t>::max) {
-        THROW_IE_EXCEPTION << "File size is too big: " << height << " X " << width;
-    }
-
-    int padSize = static_cast<int>(4 - (width * 3) % 4) % 4;
-    int sizeData = static_cast<int>(width * height * 3 + height * padSize);
-    int sizeAll = sizeData + sizeof(file) + sizeof(info);
-
-    file[2] = (unsigned char)(sizeAll);
-    file[3] = (unsigned char)(sizeAll >> 8);
-    file[4] = (unsigned char)(sizeAll >> 16);
-    file[5] = (unsigned char)(sizeAll >> 24);
-
-    info[4] = (unsigned char)(width);
-    info[5] = (unsigned char)(width >> 8);
-    info[6] = (unsigned char)(width >> 16);
-    info[7] = (unsigned char)(width >> 24);
-
-    int32_t negativeHeight = -(int32_t)height;
-    info[8] = (unsigned char)(negativeHeight);
-    info[9] = (unsigned char)(negativeHeight >> 8);
-    info[10] = (unsigned char)(negativeHeight >> 16);
-    info[11] = (unsigned char)(negativeHeight >> 24);
-
-    info[20] = (unsigned char)(sizeData);
-    info[21] = (unsigned char)(sizeData >> 8);
-    info[22] = (unsigned char)(sizeData >> 16);
-    info[23] = (unsigned char)(sizeData >> 24);
-
-    outFile.write(reinterpret_cast<char *>(file), sizeof(file));
-    outFile.write(reinterpret_cast<char *>(info), sizeof(info));
-
-    unsigned char pad[3] = { 0, 0, 0 };
-
-    for (size_t y = 0; y < height; y++) {
-        for (size_t x = 0; x < width; x++) {
-            unsigned char pixel[3];
-            pixel[0] = data[y * width * 3 + x * 3];
-            pixel[1] = data[y * width * 3 + x * 3 + 1];
-            pixel[2] = data[y * width * 3 + x * 3 + 2];
-
-            outFile.write(reinterpret_cast<char *>(pixel), 3);
-        }
-        outFile.write(reinterpret_cast<char *>(pad), padSize);
-    }
-    return true;
-}
-
-
-/**
-* @brief Adds colored rectangles to the image
-* @param data - data where rectangles are put
-* @param height - height of the rectangle
-* @param width - width of the rectangle
-* @param rectangles - vector points for the rectangle, should be 4x compared to num classes
-* @param classes - vector of classes
-* @param thickness - thickness of a line (in pixels) to be used for bounding boxes
-*/
-static UNUSED void addRectangles(unsigned char *data, size_t height, size_t width, std::vector<int> rectangles, std::vector<int> classes, int thickness = 1) {
-    std::vector<Color> colors = {  // colors to be used for bounding boxes
-        { 128, 64,  128 },
-        { 232, 35,  244 },
-        { 70,  70,  70 },
-        { 156, 102, 102 },
-        { 153, 153, 190 },
-        { 153, 153, 153 },
-        { 30,  170, 250 },
-        { 0,   220, 220 },
-        { 35,  142, 107 },
-        { 152, 251, 152 },
-        { 180, 130, 70 },
-        { 60,  20,  220 },
-        { 0,   0,   255 },
-        { 142, 0,   0 },
-        { 70,  0,   0 },
-        { 100, 60,  0 },
-        { 90,  0,   0 },
-        { 230, 0,   0 },
-        { 32,  11,  119 },
-        { 0,   74,  111 },
-        { 81,  0,   81 }
-    };
-    if (rectangles.size() % 4 != 0 || rectangles.size() / 4 != classes.size()) {
-        return;
-    }
-
-    for (size_t i = 0; i < classes.size(); i++) {
-        int x = rectangles.at(i * 4);
-        int y = rectangles.at(i * 4 + 1);
-        int w = rectangles.at(i * 4 + 2);
-        int h = rectangles.at(i * 4 + 3);
-
-        int cls = classes.at(i) % colors.size();  // color of a bounding box line
-
-        if (x < 0) x = 0;
-        if (y < 0) y = 0;
-        if (w < 0) w = 0;
-        if (h < 0) h = 0;
-
-        if (static_cast<std::size_t>(x) >= width) { x = width - 1; w = 0; thickness = 1; }
-        if (static_cast<std::size_t>(y) >= height) { y = height - 1; h = 0; thickness = 1; }
-
-        if (static_cast<std::size_t>(x + w) >= width) { w = width - x - 1; }
-        if (static_cast<std::size_t>(y + h) >= height) { h = height - y - 1; }
-
-        thickness = std::min(std::min(thickness, w / 2 + 1), h / 2 + 1);
-
-        size_t shift_first;
-        size_t shift_second;
-        for (int t = 0; t < thickness; t++) {
-            shift_first = (y + t) * width * 3;
-            shift_second = (y + h - t) * width * 3;
-            for (int ii = x; ii < x + w + 1; ii++) {
-                data[shift_first + ii * 3] = colors.at(cls).red();
-                data[shift_first + ii * 3 + 1] = colors.at(cls).green();
-                data[shift_first + ii * 3 + 2] = colors.at(cls).blue();
-                data[shift_second + ii * 3] = colors.at(cls).red();
-                data[shift_second + ii * 3 + 1] = colors.at(cls).green();
-                data[shift_second + ii * 3 + 2] = colors.at(cls).blue();
-            }
-        }
-
-        for (int t = 0; t < thickness; t++) {
-            shift_first = (x + t) * 3;
-            shift_second = (x + w - t) * 3;
-            for (int ii = y; ii < y + h + 1; ii++) {
-                data[shift_first + ii * width * 3] = colors.at(cls).red();
-                data[shift_first + ii * width * 3 + 1] = colors.at(cls).green();
-                data[shift_first + ii * width * 3 + 2] = colors.at(cls).blue();
-                data[shift_second + ii * width * 3] = colors.at(cls).red();
-                data[shift_second + ii * width * 3 + 1] = colors.at(cls).green();
-                data[shift_second + ii * width * 3 + 2] = colors.at(cls).blue();
-            }
-        }
-    }
-}
-
-
-
-/**
- * Write output data to image
- * \param name - image name
- * \param data - output data
- * \param classesNum - the number of classes
- * \return false if error else true
- */
-
-static UNUSED bool writeOutputBmp(unsigned char *data, size_t height, size_t width, std::ostream &outFile) {
-    unsigned char file[14] = {
-            'B', 'M',           // magic
-            0, 0, 0, 0,         // size in bytes
-            0, 0,               // app data
-            0, 0,               // app data
-            40+14, 0, 0, 0      // start of data offset
-    };
-    unsigned char info[40] = {
-            40, 0, 0, 0,        // info hd size
-            0, 0, 0, 0,         // width
-            0, 0, 0, 0,         // height
-            1, 0,               // number color planes
-            24, 0,              // bits per pixel
-            0, 0, 0, 0,         // compression is none
-            0, 0, 0, 0,         // image bits size
-            0x13, 0x0B, 0, 0,   // horz resolution in pixel / m
-            0x13, 0x0B, 0, 0,   // vert resolution (0x03C3 = 96 dpi, 0x0B13 = 72 dpi)
-            0, 0, 0, 0,         // #colors in palette
-            0, 0, 0, 0,         // #important colors
-    };
-
-    if (height > (size_t)std::numeric_limits<int32_t>::max || width > (size_t)std::numeric_limits<int32_t>::max) {
-        THROW_IE_EXCEPTION << "File size is too big: " << height << " X " << width;
-    }
-
-    int padSize  = static_cast<int>(4 - (width * 3) % 4) % 4;
-    int sizeData = static_cast<int>(width * height * 3 + height * padSize);
-    int sizeAll  = sizeData + sizeof(file) + sizeof(info);
-
-    file[ 2] = (unsigned char)(sizeAll      );
-    file[ 3] = (unsigned char)(sizeAll >>  8);
-    file[ 4] = (unsigned char)(sizeAll >> 16);
-    file[ 5] = (unsigned char)(sizeAll >> 24);
-
-    info[ 4] = (unsigned char)(width      );
-    info[ 5] = (unsigned char)(width >>  8);
-    info[ 6] = (unsigned char)(width >> 16);
-    info[ 7] = (unsigned char)(width >> 24);
-
-    int32_t negativeHeight = -(int32_t)height;
-    info[ 8] = (unsigned char)(negativeHeight      );
-    info[ 9] = (unsigned char)(negativeHeight >>  8);
-    info[10] = (unsigned char)(negativeHeight >> 16);
-    info[11] = (unsigned char)(negativeHeight >> 24);
-
-    info[20] = (unsigned char)(sizeData      );
-    info[21] = (unsigned char)(sizeData >>  8);
-    info[22] = (unsigned char)(sizeData >> 16);
-    info[23] = (unsigned char)(sizeData >> 24);
-
-    outFile.write(reinterpret_cast<char*>(file), sizeof(file));
-    outFile.write(reinterpret_cast<char*>(info), sizeof(info));
-
-    unsigned char pad[3] = {0, 0, 0};
-
-    for (size_t y = 0; y < height; y++) {
-        for (size_t x = 0; x < width; x++) {
-            unsigned char pixel[3];
-            pixel[0] = data[y*width*3 + x*3];
-            pixel[1] = data[y*width*3 + x*3 + 1];
-            pixel[2] = data[y*width*3 + x*3 + 2];
-            outFile.write(reinterpret_cast<char *>(pixel), 3);
-        }
-        outFile.write(reinterpret_cast<char *>(pad), padSize);
-    }
-
-    return true;
-}
+// Known colors for training classes from the Cityscapes dataset
+static UNUSED const Color CITYSCAPES_COLORS[] = { // NOTE(review): triples look like B, G, R order of the official palette although Color takes (r, g, b) -- confirm
+    { 128, 64,  128 },
+    { 232, 35,  244 },
+    { 70,  70,  70 },
+    { 156, 102, 102 },
+    { 153, 153, 190 },
+    { 153, 153, 153 },
+    { 30,  170, 250 },
+    { 0,   220, 220 },
+    { 35,  142, 107 },
+    { 152, 251, 152 },
+    { 180, 130, 70 },
+    { 60,  20,  220 },
+    { 0,   0,   255 },
+    { 142, 0,   0 },
+    { 70,  0,   0 },
+    { 100, 60,  0 },
+    { 90,  0,   0 },
+    { 230, 0,   0 },
+    { 32,  11,  119 },
+    { 0,   74,  111 },
+    { 81,  0,   81 }
+};
 
 static std::vector<std::pair<std::string, InferenceEngine::InferenceEngineProfileInfo>>
 perfCountersSorted(std::map<std::string, InferenceEngine::InferenceEngineProfileInfo> perfMap) {
@@ -581,7 +157,7 @@ perfCountersSorted(std::map<std::string, InferenceEngine::InferenceEngineProfile
 }
 
 static UNUSED void printPerformanceCounts(const std::map<std::string, InferenceEngine::InferenceEngineProfileInfo>& performanceMap,
-                                          std::ostream &stream, std::string deviceName,
+                                          std::ostream &stream, const std::string &deviceName,
                                           bool bshowHeader = true) {
     long long totalTime = 0;
     // Print performance counts
@@ -668,353 +244,6 @@ inline std::string getFullDeviceName(InferenceEngine::Core& ie, std::string devi
     }
 }
 
-/**
- * @brief This class represents an object that is found by an object detection net
- */
-class DetectedObject {
-public:
-    int objectType;
-    float xmin, xmax, ymin, ymax, prob;
-    bool difficult;
-
-    DetectedObject(int _objectType, float _xmin, float _ymin, float _xmax, float _ymax, float _prob, bool _difficult = false)
-        : objectType(_objectType), xmin(_xmin), xmax(_xmax), ymin(_ymin), ymax(_ymax), prob(_prob), difficult(_difficult) {
-    }
-
-    DetectedObject(const DetectedObject& other) = default;
-
-    static float ioU(const DetectedObject& detectedObject1_, const DetectedObject& detectedObject2_) {
-        // Add small space to eliminate empty squares
-        float epsilon = 0;  // 1e-5f;
-
-        DetectedObject detectedObject1(detectedObject1_.objectType,
-                (detectedObject1_.xmin - epsilon),
-                (detectedObject1_.ymin - epsilon),
-                (detectedObject1_.xmax- epsilon),
-                (detectedObject1_.ymax- epsilon), detectedObject1_.prob);
-        DetectedObject detectedObject2(detectedObject2_.objectType,
-                (detectedObject2_.xmin + epsilon),
-                (detectedObject2_.ymin + epsilon),
-                (detectedObject2_.xmax),
-                (detectedObject2_.ymax), detectedObject2_.prob);
-
-        if (detectedObject1.objectType != detectedObject2.objectType) {
-            // objects are different, so the result is 0
-            return 0.0f;
-        }
-
-        if (detectedObject1.xmax < detectedObject1.xmin) return 0.0;
-        if (detectedObject1.ymax < detectedObject1.ymin) return 0.0;
-        if (detectedObject2.xmax < detectedObject2.xmin) return 0.0;
-        if (detectedObject2.ymax < detectedObject2.ymin) return 0.0;
-
-
-        float xmin = (std::max)(detectedObject1.xmin, detectedObject2.xmin);
-        float ymin = (std::max)(detectedObject1.ymin, detectedObject2.ymin);
-        float xmax = (std::min)(detectedObject1.xmax, detectedObject2.xmax);
-        float ymax = (std::min)(detectedObject1.ymax, detectedObject2.ymax);
-
-        // Caffe adds 1 to every length if the box isn't normalized. So do we...
-        float addendum;
-        if (xmax > 1 || ymax > 1)
-            addendum = 1;
-        else
-            addendum = 0;
-
-        // intersection
-        float intr;
-        if ((xmax >= xmin) && (ymax >= ymin)) {
-            intr = (addendum + xmax - xmin) * (addendum + ymax - ymin);
-        } else {
-            intr = 0.0f;
-        }
-
-        // union
-        float square1 = (addendum + detectedObject1.xmax - detectedObject1.xmin) * (addendum + detectedObject1.ymax - detectedObject1.ymin);
-        float square2 = (addendum + detectedObject2.xmax - detectedObject2.xmin) * (addendum + detectedObject2.ymax - detectedObject2.ymin);
-
-        float unn = square1 + square2 - intr;
-
-        return static_cast<float>(intr) / unn;
-    }
-
-    DetectedObject scale(float scale_x, float scale_y) const {
-        return DetectedObject(objectType, xmin * scale_x, ymin * scale_y, xmax * scale_x, ymax * scale_y, prob, difficult);
-    }
-};
-
-class ImageDescription {
-public:
-    const std::list<DetectedObject> alist;
-    const bool check_probs;
-
-    explicit ImageDescription(const std::list<DetectedObject> &_alist, bool _check_probs = false)
-            : alist(_alist), check_probs(_check_probs) {
-    }
-
-    static float ioUMultiple(const ImageDescription &detectedObjects, const ImageDescription &desiredObjects) {
-        const ImageDescription *detectedObjectsSmall, *detectedObjectsBig;
-        bool check_probs = desiredObjects.check_probs;
-
-        if (detectedObjects.alist.size() < desiredObjects.alist.size()) {
-            detectedObjectsSmall = &detectedObjects;
-            detectedObjectsBig = &desiredObjects;
-        } else {
-            detectedObjectsSmall = &desiredObjects;
-            detectedObjectsBig = &detectedObjects;
-        }
-
-        std::list<DetectedObject> doS = detectedObjectsSmall->alist;
-        std::list<DetectedObject> doB = detectedObjectsBig->alist;
-
-        float fullScore = 0.0f;
-        while (doS.size() > 0) {
-            float score = 0.0f;
-            std::list<DetectedObject>::iterator bestJ = doB.end();
-            for (auto j = doB.begin(); j != doB.end(); j++) {
-                float curscore = DetectedObject::ioU(*doS.begin(), *j);
-                if (score < curscore) {
-                    score = curscore;
-                    bestJ = j;
-                }
-            }
-
-            float coeff = 1.0;
-            if (check_probs) {
-                if (bestJ != doB.end()) {
-                    float mn = std::min((*bestJ).prob, (*doS.begin()).prob);
-                    float mx = std::max((*bestJ).prob, (*doS.begin()).prob);
-
-                    coeff = mn/mx;
-                }
-            }
-
-            doS.pop_front();
-            if (bestJ != doB.end()) doB.erase(bestJ);
-            fullScore += coeff * score;
-        }
-        fullScore /= detectedObjectsBig->alist.size();
-
-
-        return fullScore;
-    }
-
-    ImageDescription scale(float scale_x, float scale_y) const {
-        std::list<DetectedObject> slist;
-        for (auto& dob : alist) {
-            slist.push_back(dob.scale(scale_x, scale_y));
-        }
-        return ImageDescription(slist, check_probs);
-    }
-};
-
-struct AveragePrecisionCalculator {
-private:
-    enum MatchKind {
-        TruePositive, FalsePositive
-    };
-
-    /**
-     * Here we count all TP and FP matches for all the classes in all the images.
-     */
-    std::map<int, std::vector<std::pair<double, MatchKind>>> matches;
-
-    std::map<int, int> N;
-
-    double threshold;
-
-    static bool SortBBoxDescend(const DetectedObject& bbox1, const DetectedObject& bbox2) {
-      return bbox1.prob > bbox2.prob;
-    }
-
-    static bool SortPairDescend(const std::pair<double, MatchKind>& p1, const std::pair<double, MatchKind>& p2) {
-      return p1.first > p2.first;
-    }
-
-public:
-    explicit AveragePrecisionCalculator(double _threshold) : threshold(_threshold) { }
-
-    // gt_bboxes -> des
-    // bboxes -> det
-
-    void consumeImage(const ImageDescription &detectedObjects, const ImageDescription &desiredObjects) {
-        // Collecting IoU values
-        std::vector<bool> visited(desiredObjects.alist.size(), false);
-        std::vector<DetectedObject> bboxes{ std::begin(detectedObjects.alist), std::end(detectedObjects.alist) };
-        std::sort(bboxes.begin(), bboxes.end(), SortBBoxDescend);
-
-
-        for (auto&& detObj : bboxes) {
-            // Searching for the best match to this detection
-            // Searching for desired object
-            float overlap_max = -1;
-            int jmax = -1;
-            auto desmax = desiredObjects.alist.end();
-
-            int j = 0;
-            for (auto desObj = desiredObjects.alist.begin(); desObj != desiredObjects.alist.end(); desObj++, j++) {
-                double iou = DetectedObject::ioU(detObj, *desObj);
-                if (iou > overlap_max) {
-                    overlap_max = static_cast<float>(iou);
-                    jmax = j;
-                    desmax = desObj;
-                }
-            }
-
-            MatchKind mk;
-            if (overlap_max >= threshold) {
-                if (!desmax->difficult) {
-                    if (!visited[jmax]) {
-                        mk = TruePositive;
-                        visited[jmax] = true;
-                    } else {
-                        mk = FalsePositive;
-                    }
-                    matches[detObj.objectType].push_back(std::make_pair(detObj.prob, mk));
-                }
-            } else {
-                mk = FalsePositive;
-                matches[detObj.objectType].push_back(std::make_pair(detObj.prob, mk));
-            }
-        }
-
-        for (auto desObj = desiredObjects.alist.begin(); desObj != desiredObjects.alist.end(); desObj++) {
-            if (!desObj->difficult) {
-                N[desObj->objectType]++;
-                }
-            }
-        }
-
-    std::map<int, double> calculateAveragePrecisionPerClass() const {
-        /**
-         * Precision-to-TP curve per class (a variation of precision-to-recall curve without dividing into N)
-         */
-        std::map<int, std::map<int, double>> precisionToTP;
-
-
-        std::map<int, double> res;
-
-        for (auto m : matches) {
-            // Sorting
-            std::sort(m.second.begin(), m.second.end(), SortPairDescend);
-
-            int clazz = m.first;
-            int TP = 0, FP = 0;
-
-            std::vector<double> prec;
-            std::vector<double> rec;
-
-            for (auto mm : m.second) {
-                // Here we are descending in a probability value
-                MatchKind mk = mm.second;
-                if (mk == TruePositive) TP++;
-                else if (mk == FalsePositive) FP++;
-
-                double precision = static_cast<double>(TP) / (TP + FP);
-                double recall = 0;
-                if (N.find(clazz) != N.end()) {
-                    recall = static_cast<double>(TP) / N.at(clazz);
-                }
-
-                prec.push_back(precision);
-                rec.push_back(recall);
-            }
-
-            int num = rec.size();
-
-            // 11point from Caffe
-            double ap = 0;
-            std::vector<float> max_precs(11, 0.);
-            int start_idx = num - 1;
-            for (int j = 10; j >= 0; --j) {
-                for (int i = start_idx; i >= 0; --i) {
-                    if (rec[i] < j / 10.) {
-                        start_idx = i;
-                        if (j > 0) {
-                            max_precs[j-1] = max_precs[j];
-                        }
-                        break;
-                    } else {
-                        if (max_precs[j] < prec[i]) {
-                            max_precs[j] = static_cast<float>(prec[i]);
-                        }
-                    }
-                }
-            }
-            for (int j = 10; j >= 0; --j) {
-                ap += max_precs[j] / 11;
-            }
-            res[clazz] = ap;
-        }
-
-        return res;
-    }
-};
-
-/**
-* @brief Adds colored rectangles to the image
-* @param data - data where rectangles are put
-* @param height - height of the rectangle
-* @param width - width of the rectangle
-* @param detectedObjects - vector of detected objects
-*/
-static UNUSED void addRectangles(unsigned char *data, size_t height, size_t width, std::vector<DetectedObject> detectedObjects) {
-    std::vector<Color> colors = {
-        { 128, 64,  128 },
-        { 232, 35,  244 },
-        { 70,  70,  70 },
-        { 156, 102, 102 },
-        { 153, 153, 190 },
-        { 153, 153, 153 },
-        { 30,  170, 250 },
-        { 0,   220, 220 },
-        { 35,  142, 107 },
-        { 152, 251, 152 },
-        { 180, 130, 70 },
-        { 60,  20,  220 },
-        { 0,   0,   255 },
-        { 142, 0,   0 },
-        { 70,  0,   0 },
-        { 100, 60,  0 },
-        { 90,  0,   0 },
-        { 230, 0,   0 },
-        { 32,  11,  119 },
-        { 0,   74,  111 },
-        { 81,  0,   81 }
-    };
-
-    for (size_t i = 0; i < detectedObjects.size(); i++) {
-        int cls = detectedObjects[i].objectType % colors.size();
-
-        int xmin = static_cast<int>(detectedObjects[i].xmin * width);
-        int xmax = static_cast<int>(detectedObjects[i].xmax * width);
-        int ymin = static_cast<int>(detectedObjects[i].ymin * height);
-        int ymax = static_cast<int>(detectedObjects[i].ymax * height);
-
-        size_t shift_first = ymin*width * 3;
-        size_t shift_second = ymax*width * 3;
-        for (int x = xmin; x < xmax; x++) {
-            data[shift_first + x * 3] = colors.at(cls).red();
-            data[shift_first + x * 3 + 1] = colors.at(cls).green();
-            data[shift_first + x * 3 + 2] = colors.at(cls).blue();
-            data[shift_second + x * 3] = colors.at(cls).red();
-            data[shift_second + x * 3 + 1] = colors.at(cls).green();
-            data[shift_second + x * 3 + 2] = colors.at(cls).blue();
-        }
-
-        shift_first = xmin * 3;
-        shift_second = xmax * 3;
-        for (int y = ymin; y < ymax; y++) {
-            data[shift_first + y*width * 3] = colors.at(cls).red();
-            data[shift_first + y*width * 3 + 1] = colors.at(cls).green();
-            data[shift_first + y*width * 3 + 2] = colors.at(cls).blue();
-            data[shift_second + y*width * 3] = colors.at(cls).red();
-            data[shift_second + y*width * 3 + 1] = colors.at(cls).green();
-            data[shift_second + y*width * 3 + 2] = colors.at(cls).blue();
-        }
-    }
-}
-
 inline std::size_t getTensorWidth(const InferenceEngine::TensorDesc& desc) {
     const auto& layout = desc.getLayout();
     const auto& dims = desc.getDims();
@@ -1120,4 +349,5 @@ inline void showAvailableDevices() {
     for (const auto& device : devices) {
         std::cout << "  " << device;
     }
+    std::cout << std::endl;
 }
diff --git a/demos/common/samples/console_progress.hpp b/demos/common/samples/console_progress.hpp
deleted file mode 100644
index 5edfea80fbc..00000000000
--- a/demos/common/samples/console_progress.hpp
+++ /dev/null
@@ -1,90 +0,0 @@
-// Copyright (C) 2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-#pragma once
-
-#include <iostream>
-#include <iomanip>
-
-/**
- * @class ConsoleProgress
- * @brief A ConsoleProgress class provides functionality for printing progress dynamics
- */
-class ConsoleProgress {
-    static const int DEFAULT_DETALIZATION = 20;
-
-    size_t total;
-    size_t current = 0;
-    bool stream_output;
-    size_t detalization;
-
-public:
-    /**
-    * @brief A constructor of ConsoleProgress class
-    * @param _total - maximum value that is correspondent to 100%
-    * @param _detalization - number of symbols(.) to use to represent progress
-    */
-    explicit ConsoleProgress(size_t _total, bool _stream_output = false, size_t _detalization = DEFAULT_DETALIZATION) :
-            total(_total), detalization(_detalization) {
-        stream_output = _stream_output;
-        if (total == 0) {
-            total = 1;
-        }
-        std::cout << std::unitbuf;
-    }
-
-    /**
-     * @brief Shows progress with current data. Progress is shown from the beginning of the current line.
-     * @return
-     */
-    void showProgress() const {
-        std::stringstream strm;
-        if (!stream_output) {
-            strm << '\r';
-        }
-        strm << "Progress: [";
-        size_t i = 0;
-        for (; i < detalization * current / total; i++) {
-            strm << ".";
-        }
-        for (; i < detalization; i++) {
-            strm << " ";
-        }
-        strm << "] " << std::fixed << std::setprecision(2) << 100 * static_cast<float>(current) / total << "% done";
-        if (stream_output) {
-            std::cout << strm.str() << std::endl;
-        } else {
-            std::cout << strm.str() << std::flush;
-        }
-    }
-
-    /**
-     * @brief Updates current value and progressbar
-     * @param newProgress - new value to represent
-     */
-    void updateProgress(size_t newProgress) {
-        current = newProgress;
-        if (current > total) current = total;
-        showProgress();
-    }
-
-    /**
-     * @brief Adds value to currently represented and redraw progressbar
-     * @param add - value to add
-     */
-    void addProgress(int add) {
-        if (add < 0 && -add > static_cast<int>(current)) {
-            add = -static_cast<int>(current);
-        }
-        updateProgress(current + add);
-    }
-
-    /**
-     * @brief Output end line.
-     * @return
-     */
-    void finish() {
-        std::cerr << std::nounitbuf << "\n";
-    }
-};
diff --git a/demos/common/samples/csv_dumper.hpp b/demos/common/samples/csv_dumper.hpp
deleted file mode 100644
index 4dbcfa19f38..00000000000
--- a/demos/common/samples/csv_dumper.hpp
+++ /dev/null
@@ -1,98 +0,0 @@
-// Copyright (C) 2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-#pragma once
-
-#include <fstream>
-#include <iostream>
-#include <sstream>
-#include <string>
-#include <time.h>
-
-#include <samples/slog.hpp>
-
-/**
- * @class CsvDumper
- * @brief A CsvDumper class provides functionality for dumping the values in CSV files
- */
-class CsvDumper {
-    std::ofstream file;
-    std::string filename;
-    bool canDump = true;
-    char delimiter = ';';
-
-    std::string generateFilename() {
-        std::stringstream filename;
-        filename << "dumpfile-";
-        filename << time(nullptr);
-        filename << ".csv";
-        return filename.str();
-    }
-
-public:
-    /**
-     * @brief A constructor. Disables dumping in case dump file cannot be created
-     * @param enabled - True if dumping is enabled by default.
-     * @param name - name of file to dump to. File won't be created if first parameter is false.
-     */
-    explicit CsvDumper(bool enabled = true, const std::string& name = "") : canDump(enabled) {
-        if (!canDump) {
-            return;
-        }
-        filename = (name == "" ? generateFilename() : name);
-        file.open(filename, std::ios::out);
-        if (!file) {
-            slog::warn << "Cannot create dump file! Disabling dump." << slog::endl;
-            canDump = false;
-        }
-    }
-
-    /**
-     * @brief Sets a delimiter to use in csv file
-     * @param c - Delimiter char
-     * @return
-     */
-    void setDelimiter(char c) {
-        delimiter = c;
-    }
-
-    /**
-     * @brief Overloads operator to organize streaming values to file. Does nothing if dumping is disabled
-     *        Adds delimiter at the end of value provided
-     * @param add - value to add to dump
-     * @return reference to same object
-     */
-    template<class T>
-    CsvDumper& operator<<(const T& add) {
-        if (canDump) {
-            file << add << delimiter;
-        }
-        return *this;
-    }
-
-    /**
-     * @brief Finishes line in dump file. Does nothing if dumping is disabled
-     */
-    void endLine() {
-        if (canDump) {
-            file << "\n";
-        }
-    }
-
-    /**
-     * @brief Gets information if dump is enabled.
-     * @return true if dump is enabled and file was successfully created
-     */
-    bool dumpEnabled() {
-        return canDump;
-    }
-
-    /**
-     * @brief Gets name of a dump file
-     * @return name of a dump file
-     */
-    std::string getFilename() const {
-        return filename;
-    }
-};
diff --git a/demos/common/samples/ocv_common.hpp b/demos/common/samples/ocv_common.hpp
index 770b0d7df75..ee29eca0f1c 100644
--- a/demos/common/samples/ocv_common.hpp
+++ b/demos/common/samples/ocv_common.hpp
@@ -24,6 +24,9 @@ void matU8ToBlob(const cv::Mat& orig_image, InferenceEngine::Blob::Ptr& blob, in
     const size_t width = blobSize[3];
     const size_t height = blobSize[2];
     const size_t channels = blobSize[1];
+    if (static_cast<size_t>(orig_image.channels()) != channels) {
+        THROW_IE_EXCEPTION << "The number of channels for net input and image must match";
+    }
     T* blob_data = blob->buffer().as<T*>();
 
     cv::Mat resized_image(orig_image);
diff --git a/demos/common/samples/slog.hpp b/demos/common/samples/slog.hpp
index 186c2cf0a6d..f3b34f4e95f 100644
--- a/demos/common/samples/slog.hpp
+++ b/demos/common/samples/slog.hpp
@@ -42,7 +42,7 @@ class LogStream {
 
 public:
     /**
-     * @brief A constructor. Creates an LogStream object
+     * @brief A constructor. Creates a LogStream object
      * @param prefix The prefix to print
      */
     LogStream(const std::string &prefix, std::ostream& log_stream)
diff --git a/demos/common/vpu/vpu_tools_common.hpp b/demos/common/vpu/vpu_tools_common.hpp
deleted file mode 100644
index e2185a8b955..00000000000
--- a/demos/common/vpu/vpu_tools_common.hpp
+++ /dev/null
@@ -1,27 +0,0 @@
-// Copyright (C) 2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-#pragma once
-
-#include <string>
-#include <map>
-
-static std::map<std::string, std::string> parseConfig(const std::string &configName, char comment = '#') {
-    std::map<std::string, std::string> config = {};
-
-    std::ifstream file(configName);
-    if (!file.is_open()) {
-        return config;
-    }
-
-    std::string key, value;
-    while (file >> key >> value) {
-        if (key.empty() || key[0] == comment) {
-            continue;
-        }
-        config[key] = value;
-    }
-
-    return config;
-}
diff --git a/demos/crossroad_camera_demo/CMakeLists.txt b/demos/crossroad_camera_demo/CMakeLists.txt
index 0ba0f10f725..d3c76ab36ba 100644
--- a/demos/crossroad_camera_demo/CMakeLists.txt
+++ b/demos/crossroad_camera_demo/CMakeLists.txt
@@ -5,4 +5,5 @@
 ie_add_sample(NAME crossroad_camera_demo
               SOURCES "${CMAKE_CURRENT_SOURCE_DIR}/main.cpp"
               HEADERS "${CMAKE_CURRENT_SOURCE_DIR}/crossroad_camera_demo.hpp"
+              DEPENDENCIES monitors
               OPENCV_DEPENDENCIES highgui)
diff --git a/demos/crossroad_camera_demo/README.md b/demos/crossroad_camera_demo/README.md
index e5964695c37..300986acb25 100644
--- a/demos/crossroad_camera_demo/README.md
+++ b/demos/crossroad_camera_demo/README.md
@@ -5,7 +5,7 @@ This demo provides an inference pipeline for persons' detection, recognition and
 * `person-vehicle-bike-detection-crossroad-0078`, which is a primary detection network for finding the persons (and other objects if needed)
 * `person-attributes-recognition-crossroad-0230`, which is executed on top of the results from the first network and
 reports person attributes like gender, has hat, has long-sleeved clothes
-* `person-reidentification-retail-0079`, which is executed on top of the results from the first network and prints
+* `person-reidentification-retail-0031`, which is executed on top of the results from the first network and prints
 a vector of features for each detected person. This vector is used to conclude if it is already detected person or not.
 
 For more information about the pre-trained models, refer to the [model documentation](../../models/intel/index.md).
@@ -36,7 +36,7 @@ REID value is assigned. Otherwise, the vector is added to a global list, and new
 ## Running
 
 Running the application with the `-h` option yields the following usage message:
-```sh
+```
 ./crossroad_camera_demo -h
 InferenceEngine:
     API version ............ <version>
@@ -62,6 +62,7 @@ Options:
     -t_reid                      Optional. Cosine similarity threshold between two vectors for person reidentification.
     -no_show                     Optional. No show processed video.
     -auto_resize                 Optional. Enables resizable input with support of ROI crop & auto resize.
+    -u                           Optional. List of monitors to show initially.
 ```
 
 Running the application with an empty list of options yields the usage message given above and an error message.
@@ -87,7 +88,7 @@ If Person Attributes Recognition or Person Reidentification Retail are enabled,
 
 > **NOTE**: On VPU devices (Intel® Movidius™ Neural Compute Stick, Intel® Neural Compute Stick 2, and Intel® Vision Accelerator Design with Intel® Movidius™ VPUs) this demo has been tested on the following Model Downloader available topologies: 
 >* `person-attributes-recognition-crossroad-0230`
->* `person-reidentification-retail-0079`
+>* `person-reidentification-retail-0031`
 >* `person-vehicle-bike-detection-crossroad-0078`
 > Other models may produce unexpected results on these devices.
 
diff --git a/demos/crossroad_camera_demo/crossroad_camera_demo.hpp b/demos/crossroad_camera_demo/crossroad_camera_demo.hpp
index d5fcf5973af..184b25b3a6a 100644
--- a/demos/crossroad_camera_demo/crossroad_camera_demo.hpp
+++ b/demos/crossroad_camera_demo/crossroad_camera_demo.hpp
@@ -9,120 +9,58 @@
 #include <vector>
 #include <gflags/gflags.h>
 
-/// @brief message for help argument
 static const char help_message[] = "Print a usage message.";
-
-/// @brief message for images argument
 static const char video_message[] = "Required. Path to a video or image file. Default value is \"cam\" to work with camera.";
-
-/// @brief message for model argument
 static const char person_vehicle_bike_detection_model_message[] = "Required. Path to the Person/Vehicle/Bike Detection Crossroad model (.xml) file.";
 static const char person_attribs_model_message[] = "Optional. Path to the Person Attributes Recognition Crossroad model (.xml) file.";
 static const char person_reid_model_message[] = "Optional. Path to the Person Reidentification Retail model (.xml) file.";
-
-/// @brief message for assigning Person/Vehicle/Bike detection inference to device
-static const char target_device_message[] = "Optional. Specify the target device for Person/Vehicle/Bike Detection. " \
-                                            "The list of available devices is shown below. Default value is CPU. " \
-                                            "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
+static const char target_device_message[] = "Optional. Specify the target device for Person/Vehicle/Bike Detection. "
+                                            "The list of available devices is shown below. Default value is CPU. "
+                                            "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
                                             "The application looks for a suitable plugin for the specified device.";
-
-/// @brief message for assigning Person attributes recognition inference to device
-static const char target_device_message_person_attribs[] = "Optional. Specify the target device for Person Attributes Recognition. "\
-                                                            "The list of available devices is shown below. Default value is CPU. " \
-                                                            "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
+static const char target_device_message_person_attribs[] = "Optional. Specify the target device for Person Attributes Recognition. "
+                                                            "The list of available devices is shown below. Default value is CPU. "
+                                                            "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
                                                             "The application looks for a suitable plugin for the specified device.";
-
-/// @brief message for assigning Person Reidentification retail inference to device
-static const char target_device_message_person_reid[] = "Optional. Specify the target device for Person Reidentification Retail. "\
-                                                        "The list of available devices is shown below. Default value is CPU. " \
-                                                        "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
+static const char target_device_message_person_reid[] = "Optional. Specify the target device for Person Reidentification Retail. "
+                                                        "The list of available devices is shown below. Default value is CPU. "
+                                                        "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
                                                         "The application looks for a suitable plugin for the specified device.";
-
-/// @brief message for performance counters
 static const char performance_counter_message[] = "Optional. Enables per-layer performance statistics.";
-
-/// @brief message for clDNN custom kernels desc
-static const char custom_cldnn_message[] = "Optional. For clDNN (GPU)-targeted custom kernels, if any. "\
-"Absolute path to the xml file with the kernels desc.";
-
-/// @brief message for user library argument
-static const char custom_cpu_library_message[] = "Optional. For MKLDNN (CPU)-targeted custom layers, if any. " \
-"Absolute path to a shared library with the kernels impl.";
-
-/// @brief message for probability threshold argument for person/vehicle/bike crossroad detections
+static const char custom_cldnn_message[] = "Optional. For clDNN (GPU)-targeted custom kernels, if any. "
+                                           "Absolute path to the xml file with the kernels desc.";
+static const char custom_cpu_library_message[] = "Optional. For MKLDNN (CPU)-targeted custom layers, if any. "
+                                                 "Absolute path to a shared library with the kernels impl.";
 static const char threshold_output_message[] = "Optional. Probability threshold for person/vehicle/bike crossroad detections.";
-
-/// @brief message for probability threshold argument for person/vehicle/bike crossroad detections
 static const char threshold_output_message_person_reid[] = "Optional. Cosine similarity threshold between two vectors for person reidentification.";
-
-/// @brief message raw output flag
 static const char raw_output_message[] = "Optional. Output Inference results as raw values.";
-
-/// @brief message no show processed video
 static const char no_show_processed_video[] = "Optional. No show processed video.";
-
-/// @brief message resizable input flag
 static const char input_resizable_message[] = "Optional. Enables resizable input with support of ROI crop & auto resize.";
 
+/// @brief Message for the list of monitors to show
+static const char utilization_monitors_message[] = "Optional. List of monitors to show initially.";
 
-/// @brief Define flag for showing help message <br>
-DEFINE_bool(h, false, help_message);
 
-/// @brief Define parameter for set image file <br>
-/// It is a required parameter
+DEFINE_bool(h, false, help_message);
 DEFINE_string(i, "cam", video_message);
-
-/// @brief Define parameter for vehicle detection  model file <br>
-/// It is a required parameter
 DEFINE_string(m, "", person_vehicle_bike_detection_model_message);
-
-/// @brief Define parameter for vehicle attributes model file <br>
-/// It is a required parameter
 DEFINE_string(m_pa, "", person_attribs_model_message);
-
-/// @brief Define parameter for vehicle detection  model file <br>
-/// It is a required parameter
 DEFINE_string(m_reid, "", person_reid_model_message);
-
-/// @brief device the target device for vehicle detection infer on <br>
 DEFINE_string(d, "CPU", target_device_message);
-
-/// @brief device the target device for age gender detection on <br>
 DEFINE_string(d_pa, "CPU", target_device_message_person_attribs);
-
-/// @brief device the target device for head pose detection on <br>
 DEFINE_string(d_reid, "CPU", target_device_message_person_reid);
-
-/// @brief Enable per-layer performance report
 DEFINE_bool(pc, false, performance_counter_message);
-
-/// @brief clDNN custom kernels path <br>
-/// Default is ./lib
 DEFINE_string(c, "", custom_cldnn_message);
-
-/// @brief Absolute path to CPU library with user layers <br>
-/// It is a optional parameter
 DEFINE_string(l, "", custom_cpu_library_message);
-
-/// @brief Flag to output raw scoring results<br>
-/// It is an optional parameter
 DEFINE_bool(r, false, raw_output_message);
-
-/// @brief Define probability threshold for person/vehicle/bike crossroad detections <br>
-/// It is an optional parameter
 DEFINE_double(t, 0.5, threshold_output_message);
-
-/// @brief Define probability threshold for person/vehicle/bike crossroad detections <br>
-/// It is an optional parameter
 DEFINE_double(t_reid, 0.7, threshold_output_message_person_reid);
-
-/// @brief Flag to disable processed video showing<br>
-/// It is an optional parameter
 DEFINE_bool(no_show, false, no_show_processed_video);
+DEFINE_bool(auto_resize, false, input_resizable_message);
 
-/// \brief Enables resizable input<br>
+/// \brief Define the list of monitors to show initially<br>
 /// It is an optional parameter
-DEFINE_bool(auto_resize, false, input_resizable_message);
+DEFINE_string(u, "", utilization_monitors_message);
 
 
 /**
@@ -150,4 +88,5 @@ static void showUsage() {
     std::cout << "    -t_reid                      " << threshold_output_message_person_reid << std::endl;
     std::cout << "    -no_show                     " << no_show_processed_video << std::endl;
     std::cout << "    -auto_resize                 " << input_resizable_message << std::endl;
+    std::cout << "    -u                           " << utilization_monitors_message << std::endl;
 }
diff --git a/demos/crossroad_camera_demo/main.cpp b/demos/crossroad_camera_demo/main.cpp
index 82bd63b69ba..cd83821a38c 100644
--- a/demos/crossroad_camera_demo/main.cpp
+++ b/demos/crossroad_camera_demo/main.cpp
@@ -23,12 +23,10 @@
 
 #include <inference_engine.hpp>
 
+#include <monitors/presenter.h>
 #include <samples/slog.hpp>
 #include <samples/ocv_common.hpp>
 #include "crossroad_camera_demo.hpp"
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
 
 using namespace InferenceEngine;
 
@@ -66,13 +64,13 @@ struct BaseDetection {
     std::string inputName;
     std::string outputName;
 
-    BaseDetection(std::string &commandLineFlag, std::string topoName)
+    BaseDetection(std::string &commandLineFlag, const std::string &topoName)
             : commandLineFlag(commandLineFlag), topoName(topoName) {}
 
     ExecutableNetwork * operator ->() {
         return &net;
     }
-    virtual CNNNetwork read()  = 0;
+    virtual CNNNetwork read(const Core& ie)  = 0;
 
     virtual void setRoiBlob(const Blob::Ptr &roiBlob) {
         if (!enabled())
@@ -160,23 +158,19 @@ struct PersonDetection : BaseDetection{
     }
 
     PersonDetection() : BaseDetection(FLAGS_m, "Person Detection"), maxProposalCount(0), objectSize(0) {}
-    CNNNetwork read() override {
+    CNNNetwork read(const Core& ie) override {
         slog::info << "Loading network files for PersonDetection" << slog::endl;
-        CNNNetReader netReader;
         /** Read network model **/
-        netReader.ReadNetwork(FLAGS_m);
+        auto network = ie.ReadNetwork(FLAGS_m);
         /** Set batch size to 1 **/
         slog::info << "Batch size is forced to  1" << slog::endl;
-        netReader.getNetwork().setBatchSize(1);
-        /** Extract model name and load it's weights **/
-        std::string binFileName = fileNameNoExt(FLAGS_m) + ".bin";
-        netReader.ReadWeights(binFileName);
+        network.setBatchSize(1);
         // -----------------------------------------------------------------------------------------------------
 
         /** SSD-based network should have one input and one output **/
         // ---------------------------Check inputs ------------------------------------------------------
         slog::info << "Checking Person Detection inputs" << slog::endl;
-        InputsDataMap inputInfo(netReader.getNetwork().getInputsInfo());
+        InputsDataMap inputInfo(network.getInputsInfo());
         if (inputInfo.size() != 1) {
             throw std::logic_error("Person Detection network should have only one input");
         }
@@ -194,7 +188,7 @@ struct PersonDetection : BaseDetection{
 
         // ---------------------------Check outputs ------------------------------------------------------
         slog::info << "Checking Person Detection outputs" << slog::endl;
-        OutputsDataMap outputInfo(netReader.getNetwork().getOutputsInfo());
+        OutputsDataMap outputInfo(network.getOutputsInfo());
         if (outputInfo.size() != 1) {
             throw std::logic_error("Person Detection network should have only one output");
         }
@@ -213,7 +207,7 @@ struct PersonDetection : BaseDetection{
         _output->setLayout(Layout::NCHW);
 
         slog::info << "Loading Person Detection model to the "<< FLAGS_d << " device" << slog::endl;
-        return netReader.getNetwork();
+        return network;
     }
 
     void fetchResults() {
@@ -282,22 +276,19 @@ struct PersonAttribsDetection : BaseDetection {
                     10, cv::KMEANS_RANDOM_CENTERS, centers);
         centers.convertTo(centers, CV_8U);
         centers = centers.reshape(0, clusterCount);
-        std::map<int, cv::Vec3b, std::greater<int>> max_color;
         std::vector<int> freq(clusterCount);
 
         for (int i = 0; i < labels.rows * labels.cols; ++i) {
             freq[labels.at<int>(i)]++;
         }
 
-        for (size_t i = 0; i < freq.size(); ++i) {
-            max_color[freq[i]] = centers.at<cv::Vec3b>(i);
-        }
+        auto freqArgmax = std::max_element(freq.begin(), freq.end()) - freq.begin();
 
-        return max_color.begin()->second;
+        return centers.at<cv::Vec3b>(freqArgmax);
     }
 
     AttributesAndColorPoints GetPersonAttributes() {
-        static const std::vector<std::string> attributesVec = {
+        static const char *const attributeStrings[] = {
                 "is male", "has_bag", "has_backpack" , "has hat", "has longsleeves", "has longpants", "has longhair", "has coat_jacket"
         };
 
@@ -308,10 +299,10 @@ struct PersonAttribsDetection : BaseDetection {
         size_t numOfTCPointChannels = topColorPointBlob->getTensorDesc().getDims().at(1);
         size_t numOfBCPointChannels = bottomColorPointBlob->getTensorDesc().getDims().at(1);
 
-        if (numOfAttrChannels != attributesVec.size()) {
+        if (numOfAttrChannels != arraySize(attributeStrings)) {
             throw std::logic_error("Output size (" + std::to_string(numOfAttrChannels) + ") of the "
-                                   "Person Attributes Recognition network is not equal to used person "
-                                   "attributes vector size (" + std::to_string(attributesVec.size()) + ")");
+                                   "Person Attributes Recognition network is not equal to expected "
+                                   "number of attributes (" + std::to_string(arraySize(attributeStrings)) + ")");
         }
         if (numOfTCPointChannels != 2) {
             throw std::logic_error("Output size (" + std::to_string(numOfTCPointChannels) + ") of the "
@@ -334,31 +325,27 @@ struct PersonAttribsDetection : BaseDetection {
         returnValue.bottom_color_point.x = outputBCPointValues[0];
         returnValue.bottom_color_point.y = outputBCPointValues[1];
 
-        for (size_t i = 0; i < attributesVec.size(); i++) {
-            returnValue.attributes_strings.push_back(attributesVec[i]);
+        for (size_t i = 0; i < arraySize(attributeStrings); i++) {
+            returnValue.attributes_strings.push_back(attributeStrings[i]);
             returnValue.attributes_indicators.push_back(outputAttrValues[i] > 0.5);
         }
 
         return returnValue;
     }
 
-    CNNNetwork read() override {
+    CNNNetwork read(const Core& ie) override {
         slog::info << "Loading network files for PersonAttribs" << slog::endl;
-        CNNNetReader netReader;
         /** Read network model **/
-        netReader.ReadNetwork(FLAGS_m_pa);
-        netReader.getNetwork().setBatchSize(1);
-        slog::info << "Batch size is forced to 1 for Person Attribs" << slog::endl;
-
+        auto network = ie.ReadNetwork(FLAGS_m_pa);
-        /** Extract model name and load it's weights **/
+        /** Set batch size to 1 **/
-        std::string binFileName = fileNameNoExt(FLAGS_m_pa) + ".bin";
-        netReader.ReadWeights(binFileName);
+        network.setBatchSize(1);
+        slog::info << "Batch size is forced to 1 for Person Attribs" << slog::endl;
         // -----------------------------------------------------------------------------------------------------
 
         /** Person Attribs network should have one input two outputs **/
         // ---------------------------Check inputs ------------------------------------------------------
         slog::info << "Checking PersonAttribs inputs" << slog::endl;
-        InputsDataMap inputInfo(netReader.getNetwork().getInputsInfo());
+        InputsDataMap inputInfo(network.getInputsInfo());
         if (inputInfo.size() != 1) {
             throw std::logic_error("Person Attribs topology should have only one input");
         }
@@ -375,7 +362,7 @@ struct PersonAttribsDetection : BaseDetection {
 
         // ---------------------------Check outputs ------------------------------------------------------
         slog::info << "Checking Person Attribs outputs" << slog::endl;
-        OutputsDataMap outputInfo(netReader.getNetwork().getOutputsInfo());
+        OutputsDataMap outputInfo(network.getOutputsInfo());
         if (outputInfo.size() != 3) {
              throw std::logic_error("Person Attribs Network expects networks having one output");
         }
@@ -385,7 +372,7 @@ struct PersonAttribsDetection : BaseDetection {
         outputNameForBottomColorPoint = (it++)->second->getName();  // bottom color location
         slog::info << "Loading Person Attributes Recognition model to the "<< FLAGS_d_pa << " device" << slog::endl;
         _enabled = true;
-        return netReader.getNetwork();
+        return network;
     }
 };
 
@@ -395,12 +382,11 @@ struct PersonReIdentification : BaseDetection {
     PersonReIdentification() : BaseDetection(FLAGS_m_reid, "Person Reidentification Retail") {}
 
     unsigned long int findMatchingPerson(const std::vector<float> &newReIdVec) {
-        float cosSim;
         auto size = globalReIdVec.size();
 
         /* assigned REID is index of the matched vector from the globalReIdVec */
         for (size_t i = 0; i < size; ++i) {
-            cosSim = cosineSimilarity(newReIdVec, globalReIdVec[i]);
+            float cosSim = cosineSimilarity(newReIdVec, globalReIdVec[i]);
             if (FLAGS_r) {
                 std::cout << "cosineSimilarity: " << cosSim << std::endl;
             }
@@ -419,14 +405,8 @@ struct PersonReIdentification : BaseDetection {
         Blob::Ptr attribsBlob = request.GetBlob(outputName);
 
         auto numOfChannels = attribsBlob->getTensorDesc().getDims().at(1);
-        /* output descriptor of Person Reidentification Recognition network has size 256 */
-        if (numOfChannels != 256) {
-            throw std::logic_error("Output size (" + std::to_string(numOfChannels) + ") of the "
-                                   "Person Reidentification network is not equal to 256");
-        }
-
         auto outputValues = attribsBlob->buffer().as<float*>();
-        return std::vector<float>(outputValues, outputValues + 256);
+        return std::vector<float>(outputValues, outputValues + numOfChannels);
     }
 
     template <typename T>
@@ -453,21 +433,16 @@ struct PersonReIdentification : BaseDetection {
         return mul / (sqrt(denomA) * sqrt(denomB));
     }
 
-    CNNNetwork read() override {
+    CNNNetwork read(const Core& ie) override {
         slog::info << "Loading network files for Person Reidentification" << slog::endl;
-        CNNNetReader netReader;
         /** Read network model **/
-        netReader.ReadNetwork(FLAGS_m_reid);
+        auto network = ie.ReadNetwork(FLAGS_m_reid);
         slog::info << "Batch size is forced to  1 for Person Reidentification Network" << slog::endl;
-        netReader.getNetwork().setBatchSize(1);
-        /** Extract model name and load it's weights **/
-        std::string binFileName = fileNameNoExt(FLAGS_m_reid) + ".bin";
-        netReader.ReadWeights(binFileName);
-
+        network.setBatchSize(1);
         /** Person Reidentification network should have 1 input and one output **/
         // ---------------------------Check inputs ------------------------------------------------------
         slog::info << "Checking Person Reidentification Network input" << slog::endl;
-        InputsDataMap inputInfo(netReader.getNetwork().getInputsInfo());
+        InputsDataMap inputInfo(network.getInputsInfo());
         if (inputInfo.size() != 1) {
             throw std::logic_error("Person Reidentification Retail should have 1 input");
         }
@@ -484,7 +459,7 @@ struct PersonReIdentification : BaseDetection {
 
         // ---------------------------Check outputs ------------------------------------------------------
         slog::info << "Checking Person Reidentification Network output" << slog::endl;
-        OutputsDataMap outputInfo(netReader.getNetwork().getOutputsInfo());
+        OutputsDataMap outputInfo(network.getOutputsInfo());
         if (outputInfo.size() != 1) {
             throw std::logic_error("Person Reidentification Network should have 1 output");
         }
@@ -492,7 +467,7 @@ struct PersonReIdentification : BaseDetection {
         slog::info << "Loading Person Reidentification Retail model to the "<< FLAGS_d_reid << " device" << slog::endl;
 
         _enabled = true;
-        return netReader.getNetwork();
+        return network;
     }
 };
 
@@ -502,7 +477,7 @@ struct Load {
 
     void into(Core & ie, const std::string & deviceName) const {
         if (detector.enabled()) {
-            detector.net = ie.LoadNetwork(detector.read(), deviceName);
+            detector.net = ie.LoadNetwork(detector.read(ie), deviceName);
         }
     }
 };
@@ -559,10 +534,6 @@ int main(int argc, char *argv[]) {
             std::cout << ie.GetVersions(flag) << std::endl;
 
             if ((flag.find("CPU") != std::string::npos)) {
-#ifdef WITH_EXTENSIONS
-                /** Load default extensions lib for the CPU device (e.g. SSD's DetectionOutput)**/
-                ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-#endif
                 if (!FLAGS_l.empty()) {
                     // CPU(MKLDNN) extensions are loaded as a shared library and passed as a pointer to base extension
                     auto extension_ptr = make_so_pointer<IExtension>(FLAGS_l);
@@ -608,6 +579,9 @@ int main(int argc, char *argv[]) {
         }
         std::cout << std::endl;
 
+        cv::Size graphSize{static_cast<int>(cap.get(cv::CAP_PROP_FRAME_WIDTH) / 4), 60};
+        Presenter presenter(FLAGS_u, static_cast<int>(cap.get(cv::CAP_PROP_FRAME_HEIGHT)) - graphSize.height - 10, graphSize);
+
         do {
             // get and enqueue the next frame (in case of video)
             if (isVideo && !cap.read(frame)) {
@@ -780,6 +754,8 @@ int main(int argc, char *argv[]) {
                 }
             }
 
+            presenter.drawGraphs(frame);
+
             // --------------------------- Execution statistics ------------------------------------------------
             std::ostringstream out;
             out << "Person detection time  : " << std::fixed << std::setprecision(2) << detection.count()
@@ -820,6 +796,7 @@ int main(int argc, char *argv[]) {
                 const int key = cv::waitKey(isVideo ? 1 : 0);
                 if (27 == key)  // Esc
                     break;
+                presenter.handleKey(key);
             }
         } while (isVideo);
 
@@ -843,6 +820,8 @@ int main(int argc, char *argv[]) {
                 personReId.printPerformanceCounts(getFullDeviceName(mapDevices, FLAGS_d_reid));
             }
         }
+
+        std::cout << presenter.reportMeans() << '\n';
         // -----------------------------------------------------------------------------------------------------
     }
     catch (const std::exception& error) {
diff --git a/demos/gaze_estimation_demo/CMakeLists.txt b/demos/gaze_estimation_demo/CMakeLists.txt
index 02f7d4e0459..deece6f776b 100644
--- a/demos/gaze_estimation_demo/CMakeLists.txt
+++ b/demos/gaze_estimation_demo/CMakeLists.txt
@@ -9,4 +9,5 @@ ie_add_sample(NAME gaze_estimation_demo
               SOURCES ${SOURCES}
               HEADERS ${HEADERS}
               INCLUDE_DIRECTORIES "${CMAKE_CURRENT_SOURCE_DIR}/include"
+              DEPENDENCIES monitors
               OPENCV_DEPENDENCIES highgui)        
diff --git a/demos/gaze_estimation_demo/README.md b/demos/gaze_estimation_demo/README.md
index e6d5d594128..ed49233bd54 100644
--- a/demos/gaze_estimation_demo/README.md
+++ b/demos/gaze_estimation_demo/README.md
@@ -27,7 +27,7 @@ Other demo objectives are:
 ## Running
 
 Running the application with the `-h` option yields the following usage message:
-```sh
+```
 ./gaze_estimation_demo -h
 InferenceEngine:
     API version ............ <version>
@@ -52,6 +52,7 @@ Options:
     -pc                      Optional. Enable per-layer performance report.
     -r                       Optional. Output inference results as raw values.
     -t                       Optional. Probability threshold for Face Detector. The default value is 0.5.
+    -u                       Optional. List of monitors to show initially.
 ```
 
 Running the application with an empty list of options yields an error message.
diff --git a/demos/gaze_estimation_demo/gaze_estimation_demo.hpp b/demos/gaze_estimation_demo/gaze_estimation_demo.hpp
index fac7ee02444..eadacdfe12d 100644
--- a/demos/gaze_estimation_demo/gaze_estimation_demo.hpp
+++ b/demos/gaze_estimation_demo/gaze_estimation_demo.hpp
@@ -16,118 +16,51 @@
 #include <dirent.h>
 #endif
 
-/// @brief Message for help argument
 static const char help_message[] = "Print a usage message.";
-
-/// @brief Message for images argument
 static const char video_message[] = "Optional. Path to a video file. Default value is \"cam\" to work with camera.";
-
-/// @brief message for model argument
 static const char gaze_estimation_model_message[] = "Required. Path to an .xml file with a trained Gaze Estimation model.";
 static const char face_detection_model_message[] = "Required. Path to an .xml file with a trained Face Detection model.";
 static const char head_pose_model_message[] = "Required. Path to an .xml file with a trained Head Pose Estimation model.";
 static const char facial_landmarks_model_message[] = "Required. Path to an .xml file with a trained Facial Landmarks Estimation model.";
-
-/// @brief Message for plugin argument
-static const char plugin_message[] = "Plugin name. For example, CPU. If this parameter is specified, " \
-"the demo will look for this plugin only.";
-
-/// @brief Message for assigning gaze calculation to device
-static const char target_device_message[] = "Optional. Target device for Gaze Estimation network (the list of available devices is shown below). " \
-"Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for a specified device. Default value is \"CPU\".";
-
-/// @brief Message for assigning face detection calculation to device
-static const char target_device_message_fd[] = "Optional. Target device for Face Detection network (the list of available devices is shown below). " \
-"Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for a specified device. Default value is \"CPU\".";
-
-/// @brief Message for assigning head pose calculation to device
-static const char target_device_message_hp[] = "Optional. Target device for Head Pose Estimation network (the list of available devices is shown below). " \
-"Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for a specified device. Default value is \"CPU\".";
-
-/// @brief Message for assigning facial landmarks calculation to device
-static const char target_device_message_lm[] = "Optional. Target device for Facial Landmarks Estimation network " \
-"(the list of available devices is shown below). Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for device specified. Default value is \"CPU\".";
-
-/// @brief Message for assigning setting resolution of camera
+static const char plugin_message[] = "Plugin name. For example, CPU. If this parameter is specified, "
+                                     "the demo will look for this plugin only.";
+static const char target_device_message[] = "Optional. Target device for Gaze Estimation network (the list of available devices is shown below). "
+                                            "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                            "The demo will look for a suitable plugin for a specified device. Default value is \"CPU\".";
+static const char target_device_message_fd[] = "Optional. Target device for Face Detection network (the list of available devices is shown below). "
+                                               "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                               "The demo will look for a suitable plugin for a specified device. Default value is \"CPU\".";
+static const char target_device_message_hp[] = "Optional. Target device for Head Pose Estimation network (the list of available devices is shown below). "
+                                               "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                               "The demo will look for a suitable plugin for a specified device. Default value is \"CPU\".";
+static const char target_device_message_lm[] = "Optional. Target device for Facial Landmarks Estimation network "
+                                               "(the list of available devices is shown below). Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                               "The demo will look for a suitable plugin for device specified. Default value is \"CPU\".";
 static const char camera_resolution_message[] = "Optional. Set camera resolution in format WxH.";
-
-/// @brief Message for performance counters
 static const char performance_counter_message[] = "Optional. Enable per-layer performance report.";
-
-/// @brief Message for probability threshold argument
 static const char thresh_output_message[] = "Optional. Probability threshold for Face Detector. The default value is 0.5.";
-
-/// @brief Message raw output flag
 static const char raw_output_message[] = "Optional. Output inference results as raw values.";
-
-/// @brief Message for enabling Face Detector network reshape
 static const char fd_reshape_message[] = "Optional. Reshape Face Detector network so that its input resolution has the same aspect ratio as the input frame.";
-
-/// @brief Message do not show processed video
 static const char no_show_processed_video[] = "Optional. Do not show processed video.";
+static const char utilization_monitors_message[] = "Optional. List of monitors to show initially.";
 
-/// \brief Define flag for showing help message<br>
 DEFINE_bool(h, false, help_message);
-
-/// \brief Define parameter for set image file<br>
-/// It is a required parameter
 DEFINE_string(i, "cam", video_message);
-
-/// \brief Define parameter for Gaze Estimation model file<br>
-/// It is a required parameter
 DEFINE_string(m, "", gaze_estimation_model_message);
-
-/// \brief Define parameter for Face Detection model file<br>
-/// It is a required parameter
 DEFINE_string(m_fd, "", face_detection_model_message);
-
-/// \brief Define parameter for Head Pose Estimation model file<br>
-/// It is a required parameter
 DEFINE_string(m_hp, "", head_pose_model_message);
-
-/// \brief Define parameter for Facial Landmarks Estimation model file<br>
-/// It is an optional parameter
 DEFINE_string(m_lm, "", facial_landmarks_model_message);
-
-/// \brief target device for Gaze Estimation network<br>
 DEFINE_string(d, "CPU", target_device_message);
-
-/// \brief Define parameter for target device for Face Detection network<br>
 DEFINE_string(d_fd, "CPU", target_device_message_fd);
-
-/// \brief Define parameter for target device for Head Pose Estimation network<br>
 DEFINE_string(d_hp, "CPU", target_device_message_hp);
-
-/// \brief Define parameter for target device for Facial Landmarks Estimation network<br>
 DEFINE_string(d_lm, "CPU", target_device_message_lm);
-
-/// \brief Define parameter camera resolution<br>
-/// It is an optional parameter
 DEFINE_string(res, "", camera_resolution_message);
-
-/// \brief Define parameter to enable face detector network reshape<br>
-/// It is an optional parameter
 DEFINE_bool(fd_reshape, false, fd_reshape_message);
-
-/// \brief Define parameter to enable per-layer performance report<br>
-/// It is an optional parameter
 DEFINE_bool(pc, false, performance_counter_message);
-
-/// \brief Define a flag to output raw scoring results<br>
-/// It is an optional parameter
 DEFINE_bool(r, false, raw_output_message);
-
-/// \brief Define a parameter for probability threshold for detections<br>
-/// It is an optional parameter
 DEFINE_double(t, 0.5, thresh_output_message);
-
-/// \brief Define a flag to disable showing processed video<br>
-/// It is an optional parameter
 DEFINE_bool(no_show, false, no_show_processed_video);
+DEFINE_string(u, "", utilization_monitors_message);
 
 /**
 * \brief This function shows a help message
@@ -154,4 +87,5 @@ static void showUsage() {
     std::cout << "    -pc                      " << performance_counter_message << std::endl;
     std::cout << "    -r                       " << raw_output_message << std::endl;
     std::cout << "    -t                       " << thresh_output_message << std::endl;
+    std::cout << "    -u                       " << utilization_monitors_message << std::endl;
 }
diff --git a/demos/gaze_estimation_demo/include/face_detector.hpp b/demos/gaze_estimation_demo/include/face_detector.hpp
index 7c13b4d766f..53d13388b57 100644
--- a/demos/gaze_estimation_demo/include/face_detector.hpp
+++ b/demos/gaze_estimation_demo/include/face_detector.hpp
@@ -28,6 +28,11 @@ class FaceDetector {
 
 private:
     IEWrapper ieWrapper;
+    std::string inputBlobName;
+    std::vector<unsigned long> inputBlobDims;
+    std::string outputBlobName;
+    std::size_t numTotalDetections;
+
     double detectionThreshold;
     bool enableReshape;
 
diff --git a/demos/gaze_estimation_demo/include/gaze_estimator.hpp b/demos/gaze_estimation_demo/include/gaze_estimator.hpp
index e025fae96ca..143928152ea 100644
--- a/demos/gaze_estimation_demo/include/gaze_estimator.hpp
+++ b/demos/gaze_estimation_demo/include/gaze_estimator.hpp
@@ -26,6 +26,7 @@ class GazeEstimator: public BaseEstimator {
 
 private:
     IEWrapper ieWrapper;
+    std::string outputBlobName;
     bool rollAlign;
     cv::Rect createEyeBoundingBox(const cv::Point2i& p1, const cv::Point2i& p2, float scale = 1.8) const;
     void rotateImageAroundCenter(const cv::Mat& srcImage, cv::Mat& dstImage, float angle) const;
diff --git a/demos/gaze_estimation_demo/include/head_pose_estimator.hpp b/demos/gaze_estimation_demo/include/head_pose_estimator.hpp
index 1d5f2e4d212..96cc396fbaa 100644
--- a/demos/gaze_estimation_demo/include/head_pose_estimator.hpp
+++ b/demos/gaze_estimation_demo/include/head_pose_estimator.hpp
@@ -25,5 +25,6 @@ class HeadPoseEstimator: public BaseEstimator {
 
 private:
     IEWrapper ieWrapper;
+    std::string inputBlobName;
 };
 }  // namespace gaze_estimation
diff --git a/demos/gaze_estimation_demo/include/ie_wrapper.hpp b/demos/gaze_estimation_demo/include/ie_wrapper.hpp
index 6e755c898e2..ce5f43b4105 100644
--- a/demos/gaze_estimation_demo/include/ie_wrapper.hpp
+++ b/demos/gaze_estimation_demo/include/ie_wrapper.hpp
@@ -30,16 +30,19 @@ class IEWrapper {
     // For setting input blobs containing vectors of data
     void setInputBlob(const std::string& blobName, const std::vector<float>& data);
 
-    // Get output blob content as a vector given its name (if there are more than one output blob)
+    // Get output blob content as a vector given its name
     void getOutputBlob(const std::string& blobName, std::vector<float>& output);
-    // Get output blob content as a vector (if there is only one output blob)
-    void getOutputBlob(std::vector<float>& output);
 
     void printPerlayerPerformance() const;
 
-    const std::map<std::string, std::vector<unsigned long>>& getIputBlobDimsInfo() const;
+    const std::map<std::string, std::vector<unsigned long>>& getInputBlobDimsInfo() const;
     const std::map<std::string, std::vector<unsigned long>>& getOutputBlobDimsInfo() const;
 
+    std::string expectSingleInput() const;
+    std::string expectSingleOutput() const;
+
+    void expectImageInput(const std::string& blobName) const;
+
     void reshape(const std::map<std::string, std::vector<unsigned long>>& newBlobsDimsInfo);
 
     void infer();
@@ -48,7 +51,6 @@ class IEWrapper {
     std::string modelPath;
     std::string deviceName;
     InferenceEngine::Core& ie;
-    InferenceEngine::CNNNetReader netReader;
     InferenceEngine::CNNNetwork network;
     InferenceEngine::ExecutableNetwork executableNetwork;
     InferenceEngine::InferRequest request;
diff --git a/demos/gaze_estimation_demo/include/landmarks_estimator.hpp b/demos/gaze_estimation_demo/include/landmarks_estimator.hpp
index ed834a8589b..f65ab817a2d 100644
--- a/demos/gaze_estimation_demo/include/landmarks_estimator.hpp
+++ b/demos/gaze_estimation_demo/include/landmarks_estimator.hpp
@@ -25,5 +25,6 @@ class LandmarksEstimator: public BaseEstimator {
 
 private:
     IEWrapper ieWrapper;
+    std::string inputBlobName, outputBlobName;
 };
 }  // namespace gaze_estimation
diff --git a/demos/gaze_estimation_demo/main.cpp b/demos/gaze_estimation_demo/main.cpp
index e3bb7cef3d6..e0df0025241 100644
--- a/demos/gaze_estimation_demo/main.cpp
+++ b/demos/gaze_estimation_demo/main.cpp
@@ -28,6 +28,7 @@
 
 #include <inference_engine.hpp>
 
+#include <monitors/presenter.h>
 #include <samples/ocv_common.hpp>
 #include <samples/slog.hpp>
 
@@ -49,9 +50,6 @@
 #include "utils.hpp"
 
 #include <ie_iextension.h>
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
 
 using namespace InferenceEngine;
 using namespace gaze_estimation;
@@ -140,8 +138,8 @@ int main(int argc, char *argv[]) {
         LandmarksEstimator landmarksEstimator(ie, FLAGS_m_lm, FLAGS_d_lm);
         GazeEstimator gazeEstimator(ie, FLAGS_m, FLAGS_d);
 
-        // Put pointers to all estimators in a vector so that they could be processed uniformly in a loop
-        std::vector<BaseEstimator*> estimators = {&headPoseEstimator, &landmarksEstimator, &gazeEstimator};
+        // Put pointers to all estimators in an array so that they could be processed uniformly in a loop
+        BaseEstimator* estimators[] = {&headPoseEstimator, &landmarksEstimator, &gazeEstimator};
 
         // Each element of the vector contains inference results on one face
         std::vector<FaceInferenceResults> inferenceResults;
@@ -153,7 +151,8 @@ int main(int argc, char *argv[]) {
 
         int delay = 1;
         std::string windowName = "Gaze estimation demo";
-        double overallTime = 0., inferenceTime = 0.;
+        cv::Size graphSize{static_cast<int>(cap.get(cv::CAP_PROP_FRAME_WIDTH) / 4), 60};
+        Presenter presenter(FLAGS_u, static_cast<int>(cap.get(cv::CAP_PROP_FRAME_HEIGHT)) - graphSize.height - 10, graphSize);
         auto tIterationBegins = cv::getTickCount();
         do {
             if (flipImage) {
@@ -172,11 +171,11 @@ int main(int argc, char *argv[]) {
 
             // Measure FPS
             auto tIterationEnds = cv::getTickCount();
-            overallTime = (tIterationEnds - tIterationBegins) * 1000. / cv::getTickFrequency();
+            double overallTime = (tIterationEnds - tIterationBegins) * 1000. / cv::getTickFrequency();
             overallTimeAverager.updateValue(overallTime);
             tIterationBegins = tIterationEnds;
 
-            inferenceTime = (tInferenceEnds - tInferenceBegins) * 1000. / cv::getTickFrequency();
+            double inferenceTime = (tInferenceEnds - tInferenceBegins) * 1000. / cv::getTickFrequency();
             inferenceTimeAverager.updateValue(inferenceTime);
 
             if (FLAGS_pc) {
@@ -196,6 +195,8 @@ int main(int argc, char *argv[]) {
                 continue;
             }
 
+            presenter.drawGraphs(frame);
+
             // Display the results
             for (auto const& inferenceResult : inferenceResults) {
                 resultsMarker.mark(frame, inferenceResult);
@@ -213,7 +214,10 @@ int main(int argc, char *argv[]) {
                 break;
             else if (key == 'f')
                 flipImage = !flipImage;
+            else
+                presenter.handleKey(key);
         } while (cap.read(frame));
+        std::cout << presenter.reportMeans() << '\n';
     }
     catch (const std::exception& error) {
         slog::err << error.what() << slog::endl;
diff --git a/demos/gaze_estimation_demo/src/face_detector.cpp b/demos/gaze_estimation_demo/src/face_detector.cpp
index 75de6ad8fd7..8bc190ae0d7 100644
--- a/demos/gaze_estimation_demo/src/face_detector.cpp
+++ b/demos/gaze_estimation_demo/src/face_detector.cpp
@@ -19,6 +19,22 @@ FaceDetector::FaceDetector(InferenceEngine::Core& ie,
              ieWrapper(ie, modelPath, deviceName),
              detectionThreshold(detectionConfidenceThreshold),
              enableReshape(enableReshape) {
+    const auto& inputInfo = ieWrapper.getInputBlobDimsInfo();
+
+    inputBlobName = ieWrapper.expectSingleInput();
+    ieWrapper.expectImageInput(inputBlobName);
+    inputBlobDims = inputInfo.at(inputBlobName);
+
+    const auto& outputInfo = ieWrapper.getOutputBlobDimsInfo();
+
+    outputBlobName = ieWrapper.expectSingleOutput();
+    const auto& outputBlobDims = outputInfo.at(outputBlobName);
+
+    if (outputBlobDims.size() != 4 || outputBlobDims[0] != 1 || outputBlobDims[1] != 1 || outputBlobDims[3] != 7) {
+        throw std::runtime_error(modelPath + ": expected \"" + outputBlobName + "\" to have shape 1x1xNx7");
+    }
+
+    numTotalDetections = outputBlobDims[2];
 }
 
 void FaceDetector::adjustBoundingBox(cv::Rect& boundingBox) const {
@@ -45,10 +61,6 @@ void FaceDetector::adjustBoundingBox(cv::Rect& boundingBox) const {
 std::vector<FaceInferenceResults> FaceDetector::detect(const cv::Mat& image) {
     std::vector<FaceInferenceResults> detectionResult;
 
-    auto ieInputBlobInfo = ieWrapper.getIputBlobDimsInfo().begin();
-    auto inputBlobName = ieInputBlobInfo->first;
-    auto inputBlobDims = ieInputBlobInfo->second;
-
     if (enableReshape) {
         double imageAspectRatio = std::round(100. * image.cols / image.rows) / 100.;
         double networkAspectRatio = std::round(100. * inputBlobDims[3] / inputBlobDims[2]) / 100.;
@@ -56,12 +68,11 @@ std::vector<FaceInferenceResults> FaceDetector::detect(const cv::Mat& image) {
 
          if (std::fabs(imageAspectRatio - networkAspectRatio) > aspectRatioThreshold) {
             std::cout << "Face Detection network is reshaped" << std::endl;
-            std::map<std::string, std::vector<unsigned long>> newBlobsDimsInfo;
-            auto newBlobDims(inputBlobDims);
+
             // Fix height and change width to make networkAspectRatio equal to imageAspectRatio
-            newBlobDims[3] = static_cast<unsigned long>(newBlobDims[2] * imageAspectRatio);
-            newBlobsDimsInfo[inputBlobName] = newBlobDims;
-            ieWrapper.reshape(newBlobsDimsInfo);
+            inputBlobDims[3] = static_cast<unsigned long>(inputBlobDims[2] * imageAspectRatio);
+
+            ieWrapper.reshape({{inputBlobName, inputBlobDims}});
         }
     }
 
@@ -69,27 +80,23 @@ std::vector<FaceInferenceResults> FaceDetector::detect(const cv::Mat& image) {
     ieWrapper.infer();
 
     std::vector<float> rawDetectionResults;
-    ieWrapper.getOutputBlob(rawDetectionResults);
-    auto outputBlobDims = ieWrapper.getOutputBlobDimsInfo().begin()->second;
-
-    auto nTotalDetections = outputBlobDims[2];
-    auto nInfoFields = outputBlobDims[3];
+    ieWrapper.getOutputBlob(outputBlobName, rawDetectionResults);
 
     FaceInferenceResults tmp;
 
     cv::Size imageSize(image.size());
     cv::Rect imageRect(0, 0, image.cols, image.rows);
 
-    for (unsigned long detectionID = 0; detectionID < nTotalDetections; ++detectionID) {
-        float confidence = rawDetectionResults[detectionID * nInfoFields + 2];
+    for (unsigned long detectionID = 0; detectionID < numTotalDetections; ++detectionID) {
+        float confidence = rawDetectionResults[detectionID * 7 + 2];
         if (static_cast<double>(confidence) < detectionThreshold) {
             break;
         }
 
-        auto x = rawDetectionResults[detectionID * nInfoFields + 3] * imageSize.width;
-        auto width = rawDetectionResults[detectionID * nInfoFields + 5] * imageSize.width - x;
-        auto y = rawDetectionResults[detectionID * nInfoFields + 4] * imageSize.height;
-        auto height = rawDetectionResults[detectionID * nInfoFields + 6] * imageSize.height - y;
+        auto x = rawDetectionResults[detectionID * 7 + 3] * imageSize.width;
+        auto width = rawDetectionResults[detectionID * 7 + 5] * imageSize.width - x;
+        auto y = rawDetectionResults[detectionID * 7 + 4] * imageSize.height;
+        auto height = rawDetectionResults[detectionID * 7 + 6] * imageSize.height - y;
 
         cv::Rect faceRect(static_cast<int>(x), static_cast<int>(y),
                           static_cast<int>(width), static_cast<int>(height));
diff --git a/demos/gaze_estimation_demo/src/gaze_estimator.cpp b/demos/gaze_estimation_demo/src/gaze_estimator.cpp
index 3e12fc3ac78..d84828b27ce 100644
--- a/demos/gaze_estimation_demo/src/gaze_estimator.cpp
+++ b/demos/gaze_estimation_demo/src/gaze_estimator.cpp
@@ -9,11 +9,42 @@
 #include "gaze_estimator.hpp"
 
 namespace gaze_estimation {
+
+const char BLOB_HEAD_POSE_ANGLES[] = "head_pose_angles";
+const char BLOB_LEFT_EYE_IMAGE[] = "left_eye_image";
+const char BLOB_RIGHT_EYE_IMAGE[] = "right_eye_image";
+
 GazeEstimator::GazeEstimator(InferenceEngine::Core& ie,
                              const std::string& modelPath,
                              const std::string& deviceName,
                              bool doRollAlign):
                ieWrapper(ie, modelPath, deviceName), rollAlign(doRollAlign) {
+    const auto& inputInfo = ieWrapper.getInputBlobDimsInfo();
+
+    for (const auto& blobName: {BLOB_HEAD_POSE_ANGLES, BLOB_LEFT_EYE_IMAGE, BLOB_RIGHT_EYE_IMAGE}) {
+        if (inputInfo.find(blobName) == inputInfo.end())
+            throw std::runtime_error(modelPath + ": expected to have input named \"" + blobName + "\"");
+    }
+
+    auto expectAngles = [&modelPath](const std::string& blobName, const std::vector<unsigned long>& dims) {
+        bool is1Dim = !dims.empty()
+            && std::all_of(dims.begin(), dims.end() - 1, [](unsigned long n) { return n == 1; });
+
+        if (!is1Dim || dims.back() != 3) {
+            throw std::runtime_error(modelPath + ": expected \"" + blobName + "\" to have dimensions [1x...]3");
+        }
+    };
+
+    expectAngles(BLOB_HEAD_POSE_ANGLES, inputInfo.at(BLOB_HEAD_POSE_ANGLES));
+
+    for (const auto& blobName: {BLOB_LEFT_EYE_IMAGE, BLOB_RIGHT_EYE_IMAGE}) {
+        ieWrapper.expectImageInput(blobName);
+    }
+
+    const auto& outputInfo = ieWrapper.getOutputBlobDimsInfo();
+
+    outputBlobName = ieWrapper.expectSingleOutput();
+    expectAngles(outputBlobName, outputInfo.at(outputBlobName));
 }
 
 cv::Rect GazeEstimator::createEyeBoundingBox(const cv::Point2i& p1,
@@ -82,15 +113,15 @@ void GazeEstimator::estimate(const cv::Mat& image,
         rightEyeImage = rightEyeImageRotated;
     }
 
-    ieWrapper.setInputBlob("head_pose_angles", headPoseAngles);
-    ieWrapper.setInputBlob("left_eye_image", leftEyeImage);
-    ieWrapper.setInputBlob("right_eye_image", rightEyeImage);
+    ieWrapper.setInputBlob(BLOB_HEAD_POSE_ANGLES, headPoseAngles);
+    ieWrapper.setInputBlob(BLOB_LEFT_EYE_IMAGE, leftEyeImage);
+    ieWrapper.setInputBlob(BLOB_RIGHT_EYE_IMAGE, rightEyeImage);
 
     ieWrapper.infer();
 
     std::vector<float> rawResults;
 
-    ieWrapper.getOutputBlob(rawResults);
+    ieWrapper.getOutputBlob(outputBlobName, rawResults);
 
     cv::Point3f gazeVector;
     gazeVector.x = rawResults[0];
diff --git a/demos/gaze_estimation_demo/src/head_pose_estimator.cpp b/demos/gaze_estimation_demo/src/head_pose_estimator.cpp
index 15543ac9a07..8c3ded1c64a 100644
--- a/demos/gaze_estimation_demo/src/head_pose_estimator.cpp
+++ b/demos/gaze_estimation_demo/src/head_pose_estimator.cpp
@@ -8,10 +8,35 @@
 #include "head_pose_estimator.hpp"
 
 namespace gaze_estimation {
+
+const std::pair<const char*, float cv::Point3f::*> OUTPUTS[] = {
+    {"angle_y_fc", &cv::Point3f::x},
+    {"angle_p_fc", &cv::Point3f::y},
+    {"angle_r_fc", &cv::Point3f::z},
+};
+
 HeadPoseEstimator::HeadPoseEstimator(InferenceEngine::Core& ie,
                                      const std::string& modelPath,
                                      const std::string& deviceName):
                    ieWrapper(ie, modelPath, deviceName) {
+    inputBlobName = ieWrapper.expectSingleInput();
+    ieWrapper.expectImageInput(inputBlobName);
+
+    const auto& outputInfo = ieWrapper.getOutputBlobDimsInfo();
+
+    for (const auto& output: OUTPUTS) {
+        auto it = outputInfo.find(output.first);
+
+        if (it == outputInfo.end())
+            throw std::runtime_error(
+                modelPath + ": expected to have output named \"" + output.first + "\"");
+
+        bool correctDims = std::all_of(it->second.begin(), it->second.end(),
+            [](unsigned long n) { return n == 1; });
+        if (!correctDims)
+            throw std::runtime_error(
+                modelPath + ": expected \"" + output.first + "\" to have total size 1");
+    }
 }
 
 void HeadPoseEstimator::estimate(const cv::Mat& image,
@@ -19,19 +44,15 @@ void HeadPoseEstimator::estimate(const cv::Mat& image,
     auto faceBoundingBox = outputResults.faceBoundingBox;
     auto faceCrop(cv::Mat(image, faceBoundingBox));
 
-    auto inputBlobName = ieWrapper.getIputBlobDimsInfo().begin()->first;
-
     ieWrapper.setInputBlob(inputBlobName, faceCrop);
     ieWrapper.infer();
-    std::vector<float> y, p, r;
 
-    ieWrapper.getOutputBlob("angle_y_fc", y);
-    ieWrapper.getOutputBlob("angle_p_fc", p);
-    ieWrapper.getOutputBlob("angle_r_fc", r);
+    std::vector<float> outputValue;
 
-    outputResults.headPoseAngles.x = y[0];
-    outputResults.headPoseAngles.y = p[0];
-    outputResults.headPoseAngles.z = r[0];
+    for (const auto &output: OUTPUTS) {
+        ieWrapper.getOutputBlob(output.first, outputValue);
+        outputResults.headPoseAngles.*output.second = outputValue[0];
+    }
 }
 
 void HeadPoseEstimator::printPerformanceCounts() const {
diff --git a/demos/gaze_estimation_demo/src/ie_wrapper.cpp b/demos/gaze_estimation_demo/src/ie_wrapper.cpp
index 62455fcaf48..d33994cdecf 100644
--- a/demos/gaze_estimation_demo/src/ie_wrapper.cpp
+++ b/demos/gaze_estimation_demo/src/ie_wrapper.cpp
@@ -16,10 +16,7 @@ IEWrapper::IEWrapper(InferenceEngine::Core& ie,
                      const std::string& modelPath,
                      const std::string& deviceName):
            modelPath(modelPath), deviceName(deviceName), ie(ie) {
-    netReader.ReadNetwork(modelPath);
-    std::string binFileName = fileNameNoExt(modelPath) + ".bin";
-    netReader.ReadWeights(binFileName);
-    network = netReader.getNetwork();
+    network = ie.ReadNetwork(modelPath);
     setExecPart();
 }
 
@@ -110,27 +107,35 @@ void IEWrapper::getOutputBlob(const std::string& blobName,
     }
 }
 
-void IEWrapper::getOutputBlob(std::vector<float>& output) {
-    output.clear();
-    auto blobName = outputBlobsDimsInfo.begin()->first;
-    auto blobDims = outputBlobsDimsInfo[blobName];
-    auto dataSize = 1;
-    for (auto const& dim : blobDims) {
-        dataSize *= dim;
-    }
-    auto outputBlob = request.GetBlob(blobName);
-    auto buffer = outputBlob->buffer().as<InferenceEngine::PrecisionTrait<InferenceEngine::Precision::FP32>::value_type *>();
+const std::map<std::string, std::vector<unsigned long>>& IEWrapper::getInputBlobDimsInfo() const {
+    return inputBlobsDimsInfo;
+}
+const std::map<std::string, std::vector<unsigned long>>& IEWrapper::getOutputBlobDimsInfo() const {
+    return outputBlobsDimsInfo;
+}
 
-    for (int i = 0; i < dataSize; ++i) {
-        output.push_back(buffer[i]);
+std::string IEWrapper::expectSingleInput() const {
+    if (inputBlobsDimsInfo.size() != 1) {
+        throw std::runtime_error(modelPath + ": expected to have 1 input");
     }
+
+    return inputBlobsDimsInfo.begin()->first;
 }
 
-const std::map<std::string, std::vector<unsigned long>>& IEWrapper::getIputBlobDimsInfo() const {
-    return inputBlobsDimsInfo;
+std::string IEWrapper::expectSingleOutput() const {
+    if (outputBlobsDimsInfo.size() != 1) {
+        throw std::runtime_error(modelPath + ": expected to have 1 output");
+    }
+
+    return outputBlobsDimsInfo.begin()->first;
 }
-const std::map<std::string, std::vector<unsigned long>>& IEWrapper::getOutputBlobDimsInfo() const {
-    return outputBlobsDimsInfo;
+
+void IEWrapper::expectImageInput(const std::string& blobName) const {
+    const auto& dims = inputBlobsDimsInfo.at(blobName);
+
+    if (dims.size() != 4 || dims[0] != 1 || dims[1] != 3) {
+        throw std::runtime_error(modelPath + ": expected \"" + blobName + "\" to have dimensions 1x3xHxW");
+    }
 }
 
 void IEWrapper::infer() {
diff --git a/demos/gaze_estimation_demo/src/landmarks_estimator.cpp b/demos/gaze_estimation_demo/src/landmarks_estimator.cpp
index ee9a12e4d21..8e994916b17 100644
--- a/demos/gaze_estimation_demo/src/landmarks_estimator.cpp
+++ b/demos/gaze_estimation_demo/src/landmarks_estimator.cpp
@@ -12,6 +12,21 @@ LandmarksEstimator::LandmarksEstimator(InferenceEngine::Core& ie,
                                        const std::string& modelPath,
                                        const std::string& deviceName):
                     ieWrapper(ie, modelPath, deviceName) {
+    inputBlobName = ieWrapper.expectSingleInput();
+    ieWrapper.expectImageInput(inputBlobName);
+
+    const auto& outputInfo = ieWrapper.getOutputBlobDimsInfo();
+
+    outputBlobName = ieWrapper.expectSingleOutput();
+    const auto& outputBlobDims = outputInfo.at(outputBlobName);
+
+    bool outputIs1Dim = !outputBlobDims.empty()
+        && std::all_of(outputBlobDims.begin(), outputBlobDims.end() - 1,
+            [](unsigned long n) { return n == 1; });
+
+    if (!outputIs1Dim || outputBlobDims.back() % 2 != 0) {
+        throw std::runtime_error(modelPath + ": expected \"" + outputBlobName + "\" to have dimensions [1x...]2N");
+    }
 }
 
 void LandmarksEstimator::estimate(const cv::Mat& image,
@@ -19,13 +34,11 @@ void LandmarksEstimator::estimate(const cv::Mat& image,
     auto faceBoundingBox = outputResults.faceBoundingBox;
     auto faceCrop(cv::Mat(image, faceBoundingBox));
 
-    auto inputBlobName = ieWrapper.getIputBlobDimsInfo().begin()->first;
-
     ieWrapper.setInputBlob(inputBlobName, faceCrop);
     ieWrapper.infer();
     std::vector<float> rawLandmarks;
 
-    ieWrapper.getOutputBlob(rawLandmarks);
+    ieWrapper.getOutputBlob(outputBlobName, rawLandmarks);
 
     for (unsigned long i = 0; i < rawLandmarks.size() / 2; ++i) {
         int x = static_cast<int>(rawLandmarks[2 * i] * faceCrop.cols + faceBoundingBox.tl().x);
diff --git a/demos/gaze_estimation_demo/src/utils.cpp b/demos/gaze_estimation_demo/src/utils.cpp
index b8349228082..a66897f00d0 100644
--- a/demos/gaze_estimation_demo/src/utils.cpp
+++ b/demos/gaze_estimation_demo/src/utils.cpp
@@ -38,9 +38,6 @@ void initializeIEObject(InferenceEngine::Core& ie,
 
         /** Loading extensions for the CPU device **/
         if ((deviceName.find("CPU") != std::string::npos)) {
-#ifdef WITH_EXTENSIONS
-            ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-#endif
             loadedDevices.insert(deviceName);
         }
     }
diff --git a/demos/human_pose_estimation_demo/CMakeLists.txt b/demos/human_pose_estimation_demo/CMakeLists.txt
index f50c924ce38..ddce9118dce 100644
--- a/demos/human_pose_estimation_demo/CMakeLists.txt
+++ b/demos/human_pose_estimation_demo/CMakeLists.txt
@@ -9,4 +9,5 @@ ie_add_sample(NAME human_pose_estimation_demo
               SOURCES ${SOURCES}
               HEADERS ${HEADERS}
               INCLUDE_DIRECTORIES "${CMAKE_CURRENT_SOURCE_DIR}/include"
+              DEPENDENCIES monitors
               OPENCV_DEPENDENCIES highgui)
diff --git a/demos/human_pose_estimation_demo/README.md b/demos/human_pose_estimation_demo/README.md
index ce01fe8d310..65d555b58f2 100644
--- a/demos/human_pose_estimation_demo/README.md
+++ b/demos/human_pose_estimation_demo/README.md
@@ -21,7 +21,7 @@ On the start-up, the application reads command line parameters and loads human p
 ## Running
 
 Running the application with the `-h` option yields the following usage message:
-```sh
+```
 ./human_pose_estimation_demo -h
 InferenceEngine:
     API version ............ <version>
@@ -36,8 +36,9 @@ Options:
     -d "<device>"              Optional. Specify the target device for Human Pose Estimation (the list of available devices is shown below). Default value is CPU. Use "-d HETERO:<comma-separated_devices_list>" format to specify HETERO plugin. The application looks for a suitable plugin for the specified device.
     -pc                        Optional. Enable per-layer performance report.
     -no_show                   Optional. Do not show processed video.
+    -black                     Optional. Show black background.
     -r                         Optional. Output inference results as raw values.
-
+    -u                         Optional. List of monitors to show initially.
 ```
 
 Running the application with an empty list of options yields an error message.
diff --git a/demos/human_pose_estimation_demo/include/human_pose_estimation_demo.hpp b/demos/human_pose_estimation_demo/include/human_pose_estimation_demo.hpp
index a410aa24eaa..df46811490c 100644
--- a/demos/human_pose_estimation_demo/include/human_pose_estimation_demo.hpp
+++ b/demos/human_pose_estimation_demo/include/human_pose_estimation_demo.hpp
@@ -7,56 +7,28 @@
 #include <gflags/gflags.h>
 #include <iostream>
 
-/// @brief Message for help argument
 static const char help_message[] = "Print a usage message.";
-
-/// @brief Message for video argument
 static const char video_message[] = "Required. Path to a video. Default value is \"cam\" to work with camera.";
-
-/// @brief Message for model argument
 static const char human_pose_estimation_model_message[] = "Required. Path to the Human Pose Estimation model (.xml) file.";
-
-/// @brief Message for assigning Human Pose Estimation inference to device
-static const char target_device_message[] = "Optional. Specify the target device for Human Pose Estimation "\
-                                            "(the list of available devices is shown below). Default value is CPU. " \
-                                            "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
+static const char target_device_message[] = "Optional. Specify the target device for Human Pose Estimation "
+                                            "(the list of available devices is shown below). Default value is CPU. "
+                                            "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
                                             "The application looks for a suitable plugin for the specified device.";
-
-/// @brief Message for performance counter
 static const char performance_counter_message[] = "Optional. Enable per-layer performance report.";
-
-/// @brief Message for not showing processed video
 static const char no_show_processed_video[] = "Optional. Do not show processed video.";
-
-/// @brief Message for raw output
+static const char black_background[] = "Optional. Show black background.";
 static const char raw_output_message[] = "Optional. Output inference results as raw values.";
+static const char utilization_monitors_message[] = "Optional. List of monitors to show initially.";
 
-/// @brief Defines flag for showing help message <br>
 DEFINE_bool(h, false, help_message);
-
-/// @brief Defines parameter for setting video file <br>
-/// It is a required parameter
 DEFINE_string(i, "cam", video_message);
-
-/// @brief Defines parameter for human pose estimation model file <br>
-/// It is a required parameter
 DEFINE_string(m, "", human_pose_estimation_model_message);
-
-/// @brief Defines parameter for the target device to infer on <br>
-/// It is an optional parameter
 DEFINE_string(d, "CPU", target_device_message);
-
-/// @brief Defines flag for per-layer performance report <br>
-/// It is an optional parameter
 DEFINE_bool(pc, false, performance_counter_message);
-
-/// @brief Defines flag for disabling processed video showing <br>
-/// It is an optional parameter
 DEFINE_bool(no_show, false, no_show_processed_video);
-
-/// @brief Defines flag to output raw results <br>
-/// It is an optional parameter
+DEFINE_bool(black, false, black_background);
 DEFINE_bool(r, false, raw_output_message);
+DEFINE_string(u, "", utilization_monitors_message);
 
 /**
 * @brief This function shows a help message
@@ -72,5 +44,7 @@ static void showUsage() {
     std::cout << "    -d \"<device>\"              " << target_device_message << std::endl;
     std::cout << "    -pc                        " << performance_counter_message << std::endl;
     std::cout << "    -no_show                   " << no_show_processed_video << std::endl;
+    std::cout << "    -black                     " << black_background << std::endl;
     std::cout << "    -r                         " << raw_output_message << std::endl;
+    std::cout << "    -u                         " << utilization_monitors_message << std::endl;
 }
diff --git a/demos/human_pose_estimation_demo/include/human_pose_estimator.hpp b/demos/human_pose_estimation_demo/include/human_pose_estimator.hpp
index b3b419d4757..c48b9a4391d 100644
--- a/demos/human_pose_estimation_demo/include/human_pose_estimator.hpp
+++ b/demos/human_pose_estimation_demo/include/human_pose_estimator.hpp
@@ -15,12 +15,19 @@
 namespace human_pose_estimation {
 class HumanPoseEstimator {
 public:
-    static const size_t keypointsNumber;
+    static const size_t keypointsNumber = 18;
 
     HumanPoseEstimator(const std::string& modelPath,
                        const std::string& targetDeviceName,
                        bool enablePerformanceReport = false);
-    std::vector<HumanPose> estimate(const cv::Mat& image);
+    std::vector<HumanPose> postprocessCurr();
+    void reshape(const cv::Mat& image);
+    void frameToBlobCurr(const cv::Mat& image);
+    void frameToBlobNext(const cv::Mat& image);
+    void startCurr();
+    void startNext();
+    bool readyCurr();
+    void swapRequest();
     ~HumanPoseEstimator();
 
 private:
@@ -47,13 +54,14 @@ class HumanPoseEstimator {
     float foundMidPointsRatioThreshold;
     float minSubsetScore;
     cv::Size inputLayerSize;
+    cv::Size imageSize;
     int upsampleRatio;
     InferenceEngine::Core ie;
     std::string targetDeviceName;
     InferenceEngine::CNNNetwork network;
     InferenceEngine::ExecutableNetwork executableNetwork;
-    InferenceEngine::InferRequest request;
-    InferenceEngine::CNNNetReader netReader;
+    InferenceEngine::InferRequest::Ptr requestNext;
+    InferenceEngine::InferRequest::Ptr requestCurr;
     std::string pafsBlobName;
     std::string heatmapsBlobName;
     bool enablePerformanceReport;
diff --git a/demos/human_pose_estimation_demo/main.cpp b/demos/human_pose_estimation_demo/main.cpp
index 224803d37e7..d73e3301369 100644
--- a/demos/human_pose_estimation_demo/main.cpp
+++ b/demos/human_pose_estimation_demo/main.cpp
@@ -9,9 +9,11 @@
 */
 
 #include <vector>
+#include <chrono>
 
 #include <inference_engine.hpp>
 
+#include <monitors/presenter.h>
 #include <samples/ocv_common.hpp>
 
 #include "human_pose_estimation_demo.hpp"
@@ -60,12 +62,15 @@ int main(int argc, char* argv[]) {
         }
 
         int delay = 33;
-        double inferenceTime = 0.0;
-        cv::Mat image;
-        if (!cap.read(image)) {
+
+        // read input (video) frame
+        cv::Mat curr_frame; cap >> curr_frame;
+        cv::Mat next_frame;
+        if (!cap.grab()) {
             throw std::logic_error("Failed to get frame from cv::VideoCapture");
         }
-        estimator.estimate(image);  // Do not measure network reshape, if it happened
+
+        estimator.reshape(curr_frame);  // Do not measure network reshape, if it happened
 
         std::cout << "To close the application, press 'CTRL+C' here";
         if (!FLAGS_no_show) {
@@ -74,50 +79,159 @@ int main(int argc, char* argv[]) {
         }
         std::cout << std::endl;
 
-        do {
-            double t1 = static_cast<double>(cv::getTickCount());
-            std::vector<HumanPose> poses = estimator.estimate(image);
-            double t2 = static_cast<double>(cv::getTickCount());
-            if (inferenceTime == 0) {
-                inferenceTime = (t2 - t1) / cv::getTickFrequency() * 1000;
-            } else {
-                inferenceTime = inferenceTime * 0.95 + 0.05 * (t2 - t1) / cv::getTickFrequency() * 1000;
+        cv::Size graphSize{static_cast<int>(cap.get(cv::CAP_PROP_FRAME_WIDTH) / 4), 60};
+        Presenter presenter(FLAGS_u, static_cast<int>(cap.get(cv::CAP_PROP_FRAME_HEIGHT)) - graphSize.height - 10, graphSize);
+        std::vector<HumanPose> poses;
+        bool isLastFrame = false;
+        bool isAsyncMode = false; // execution is always started in SYNC mode
+        bool isModeChanged = false; // set to true when execution mode is changed (SYNC<->ASYNC)
+        bool blackBackground = FLAGS_black;
+
+        typedef std::chrono::duration<double, std::ratio<1, 1000>> ms;
+        auto total_t0 = std::chrono::high_resolution_clock::now();
+        auto wallclock = std::chrono::high_resolution_clock::now();
+        double render_time = 0;
+
+        while (true) {
+            auto t0 = std::chrono::high_resolution_clock::now();
+            //here is the first asynchronous point:
+            //in the async mode we capture frame to populate the NEXT infer request
+            //in the regular mode we capture frame to the current infer request
+
+            if (!cap.read(next_frame)) {
+                if (next_frame.empty()) {
+                    isLastFrame = true; //end of video file
+                } else {
+                    throw std::logic_error("Failed to get frame from cv::VideoCapture");
+                }
+            }
+            if (isAsyncMode) {
+                if (isModeChanged) {
+                    estimator.frameToBlobCurr(curr_frame);
+                }
+                if (!isLastFrame) {
+                    estimator.frameToBlobNext(next_frame);
+                }
+            } else if (!isModeChanged) {
+                estimator.frameToBlobCurr(curr_frame);
             }
-            if (FLAGS_r) {
-                for (HumanPose const& pose : poses) {
-                    std::stringstream rawPose;
-                    rawPose << std::fixed << std::setprecision(0);
-                    for (auto const& keypoint : pose.keypoints) {
-                        rawPose << keypoint.x << "," << keypoint.y << " ";
+            auto t1 = std::chrono::high_resolution_clock::now();
+            double decode_time = std::chrono::duration_cast<ms>(t1 - t0).count();
+
+            t0 = std::chrono::high_resolution_clock::now();
+            // Main sync point:
+            // in the truly Async mode we start the NEXT infer request, while waiting for the CURRENT to complete
+            // in the regular mode we start the CURRENT request and immediately wait for its completion
+            if (isAsyncMode) {
+                if (isModeChanged) {
+                    estimator.startCurr();
+                }
+                if (!isLastFrame) {
+                    estimator.startNext();
+                }
+            } else if (!isModeChanged) {
+                estimator.startCurr();
+            }
+
+            if (estimator.readyCurr()) {
+                t1 = std::chrono::high_resolution_clock::now();
+                ms detection = std::chrono::duration_cast<ms>(t1 - t0);
+                t0 = std::chrono::high_resolution_clock::now();
+                ms wall = std::chrono::duration_cast<ms>(t0 - wallclock);
+                wallclock = t0;
+
+                t0 = std::chrono::high_resolution_clock::now();
+
+                if (!FLAGS_no_show) {
+                    if (blackBackground) {
+                        curr_frame = cv::Mat::zeros(curr_frame.size(), curr_frame.type());
                     }
-                    rawPose << pose.score;
-                    std::cout << rawPose.str() << std::endl;
+                    std::ostringstream out;
+                    out << "OpenCV cap/render time: " << std::fixed << std::setprecision(2)
+                        << (decode_time + render_time) << " ms";
+
+                    cv::putText(curr_frame, out.str(), cv::Point2f(0, 25),
+                                cv::FONT_HERSHEY_TRIPLEX, 0.6, cv::Scalar(0, 255, 0));
+                    out.str("");
+                    out << "Wallclock time " << (isAsyncMode ? "(TRUE ASYNC):      " : "(SYNC, press Tab): ");
+                    out << std::fixed << std::setprecision(2) << wall.count()
+                        << " ms (" << 1000.f / wall.count() << " fps)";
+                    cv::putText(curr_frame, out.str(), cv::Point2f(0, 50),
+                                cv::FONT_HERSHEY_TRIPLEX, 0.6, cv::Scalar(0, 0, 255));
+                    if (!isAsyncMode) {  // In the true async mode, there is no way to measure detection time directly
+                        out.str("");
+                        out << "Detection time  : " << std::fixed << std::setprecision(2) << detection.count()
+                        << " ms ("
+                        << 1000.f / detection.count() << " fps)";
+                        cv::putText(curr_frame, out.str(), cv::Point2f(0, 75), cv::FONT_HERSHEY_TRIPLEX, 0.6,
+                            cv::Scalar(255, 0, 0));
+                    }
+                }
+
+                poses = estimator.postprocessCurr();
+
+                if (FLAGS_r) {
+                    if (!poses.empty()) {
+                        std::time_t result = std::time(nullptr);
+                        char timeString[sizeof("2020-01-01 00:00:00: ")];
+                        std::strftime(timeString, sizeof(timeString), "%Y-%m-%d %H:%M:%S: ", std::localtime(&result));
+                        std::cout << timeString;
+                     }
+
+                    for (HumanPose const& pose : poses) {
+                        std::stringstream rawPose;
+                        rawPose << std::fixed << std::setprecision(0);
+                        for (auto const& keypoint : pose.keypoints) {
+                            rawPose << keypoint.x << "," << keypoint.y << " ";
+                        }
+                        rawPose << pose.score;
+                        std::cout << rawPose.str() << std::endl;
+                    }
+                }
+
+                if (!FLAGS_no_show) {
+                    presenter.drawGraphs(curr_frame);
+                    renderHumanPose(poses, curr_frame);
+                    cv::imshow("Human Pose Estimation on " + FLAGS_d, curr_frame);
+                    t1 = std::chrono::high_resolution_clock::now();
+                    render_time = std::chrono::duration_cast<ms>(t1 - t0).count();
                 }
             }
 
-            if (FLAGS_no_show) {
-                continue;
+            if (isLastFrame) {
+                break;
             }
 
-            renderHumanPose(poses, image);
+            if (isModeChanged) {
+                isModeChanged = false;
+            }
 
-            cv::Mat fpsPane(35, 155, CV_8UC3);
-            fpsPane.setTo(cv::Scalar(153, 119, 76));
-            cv::Mat srcRegion = image(cv::Rect(8, 8, fpsPane.cols, fpsPane.rows));
-            cv::addWeighted(srcRegion, 0.4, fpsPane, 0.6, 0, srcRegion);
-            std::stringstream fpsSs;
-            fpsSs << "FPS: " << int(1000.0f / inferenceTime * 100) / 100.0f;
-            cv::putText(image, fpsSs.str(), cv::Point(16, 32),
-                        cv::FONT_HERSHEY_COMPLEX, 0.8, cv::Scalar(0, 0, 255));
-            cv::imshow("ICV Human Pose Estimation", image);
+            // Final point:
+            // in the truly Async mode we swap the NEXT and CURRENT requests for the next iteration
+            curr_frame = next_frame;
+            next_frame = cv::Mat();
+            if (isAsyncMode) {
+                estimator.swapRequest();
+            }
 
-            int key = cv::waitKey(delay) & 255;
+            const int key = cv::waitKey(delay) & 255;
             if (key == 'p') {
                 delay = (delay == 0) ? 33 : 0;
-            } else if (key == 27) {
+            } else if (27 == key) { // Esc
                 break;
+            } else if (9 == key) { // Tab
+                isAsyncMode ^= true;
+                isModeChanged = true;
+            } else if (32 == key) { // Space
+                blackBackground ^= true;
             }
-        } while (cap.read(image));
+            presenter.handleKey(key);
+        }
+
+        auto total_t1 = std::chrono::high_resolution_clock::now();
+        ms total = std::chrono::duration_cast<ms>(total_t1 - total_t0);
+        std::cout << "Total Inference time: " << total.count() << std::endl;
+        std::cout << presenter.reportMeans() << '\n';
     }
     catch (const std::exception& error) {
         std::cerr << "[ ERROR ] " << error.what() << std::endl;
diff --git a/demos/human_pose_estimation_demo/src/human_pose_estimator.cpp b/demos/human_pose_estimation_demo/src/human_pose_estimator.cpp
index 9b3a925177b..5b2fa35c370 100644
--- a/demos/human_pose_estimation_demo/src/human_pose_estimator.cpp
+++ b/demos/human_pose_estimation_demo/src/human_pose_estimator.cpp
@@ -14,8 +14,6 @@
 #include "peak.hpp"
 
 namespace human_pose_estimation {
-const size_t HumanPoseEstimator::keypointsNumber = 18;
-
 HumanPoseEstimator::HumanPoseEstimator(const std::string& modelPath,
                                        const std::string& targetDeviceName_,
                                        bool enablePerformanceReport)
@@ -36,27 +34,74 @@ HumanPoseEstimator::HumanPoseEstimator(const std::string& modelPath,
         ie.SetConfig({{InferenceEngine::PluginConfigParams::KEY_PERF_COUNT,
                        InferenceEngine::PluginConfigParams::YES}});
     }
-    netReader.ReadNetwork(modelPath);
-    std::string binFileName = fileNameNoExt(modelPath) + ".bin";
-    netReader.ReadWeights(binFileName);
-    network = netReader.getNetwork();
-    InferenceEngine::InputInfo::Ptr inputInfo = network.getInputsInfo().begin()->second;
-    inputLayerSize = cv::Size(inputInfo->getTensorDesc().getDims()[3], inputInfo->getTensorDesc().getDims()[2]);
-    inputInfo->setPrecision(InferenceEngine::Precision::U8);
+    network = ie.ReadNetwork(modelPath);
+
+    const auto& inputInfo = network.getInputsInfo();
+
+    if (inputInfo.size() != 1) {
+        throw std::runtime_error(modelPath + ": expected to have 1 input");
+    }
+
+    const auto& imageInputInfo = *inputInfo.begin();
+    const auto& imageInputDims = imageInputInfo.second->getTensorDesc().getDims();
+
+    if (imageInputDims.size() != 4 || imageInputDims[0] != 1 || imageInputDims[1] != 3) {
+        throw std::runtime_error(
+            modelPath + ": expected \"" + imageInputInfo.first + "\" to have dimensions 1x3xHxW");
+    }
+
+    inputLayerSize = cv::Size(imageInputDims[3], imageInputDims[2]);
+    imageInputInfo.second->setPrecision(InferenceEngine::Precision::U8);
 
     InferenceEngine::OutputsDataMap outputInfo = network.getOutputsInfo();
-    auto outputBlobsIt = outputInfo.begin();
-    pafsBlobName = outputBlobsIt->first;
-    heatmapsBlobName = (++outputBlobsIt)->first;
+
+    if (outputInfo.size() != 2) {
+        throw std::runtime_error(modelPath + ": expected to have 2 outputs");
+    }
+
+    auto outputIt = outputInfo.begin();
+
+    const auto& pafsOutputInfo = *outputIt++;
+
+    pafsBlobName = pafsOutputInfo.first;
+
+    const auto& pafsOutputDims = pafsOutputInfo.second->getTensorDesc().getDims();
+
+    if (pafsOutputDims.size() != 4 || pafsOutputDims[0] != 1
+            || pafsOutputDims[1] != 2 * (keypointsNumber + 1)) {
+        throw std::runtime_error(
+            modelPath + ": expected \"" + pafsBlobName + "\" to have dimensions "
+                "1x" + std::to_string(2 * (keypointsNumber + 1)) + "xHFMxWFM");
+    }
+
+    const auto& heatmapsOutputInfo = *outputIt++;
+
+    heatmapsBlobName = heatmapsOutputInfo.first;
+
+    const auto& heatmapsOutputDims = heatmapsOutputInfo.second->getTensorDesc().getDims();
+
+    if (heatmapsOutputDims.size() != 4 || heatmapsOutputDims[0] != 1
+            || heatmapsOutputDims[1] != keypointsNumber + 1) {
+        throw std::runtime_error(
+            modelPath + ": expected \"" + heatmapsBlobName + "\" to have dimensions "
+                "1x" + std::to_string(keypointsNumber + 1) + "xHFMxWFM");
+    }
+
+    if (pafsOutputDims[2] != heatmapsOutputDims[2] || pafsOutputDims[3] != heatmapsOutputDims[3]) {
+        throw std::runtime_error(
+            modelPath + ": expected \"" + pafsBlobName + "\" and \"" + heatmapsBlobName + "\""
+                " to have matching last two dimensions");
+    }
 
     executableNetwork = ie.LoadNetwork(network, targetDeviceName);
-    request = executableNetwork.CreateInferRequest();
+    requestNext = executableNetwork.CreateInferRequestPtr();
+    requestCurr = executableNetwork.CreateInferRequestPtr();
 }
 
-std::vector<HumanPose> HumanPoseEstimator::estimate(const cv::Mat& image) {
+void HumanPoseEstimator::reshape(const cv::Mat& image){
     CV_Assert(image.type() == CV_8UC3);
 
-    cv::Size imageSize = image.size();
+    imageSize = image.size();
     if (inputWidthIsChanged(imageSize)) {
         auto input_shapes = network.getInputShapes();
         std::string input_name;
@@ -67,19 +112,50 @@ std::vector<HumanPose> HumanPoseEstimator::estimate(const cv::Mat& image) {
         input_shapes[input_name] = input_shape;
         network.reshape(input_shapes);
         executableNetwork = ie.LoadNetwork(network, targetDeviceName);
-        request = executableNetwork.CreateInferRequest();
+        requestNext = executableNetwork.CreateInferRequestPtr();
+        requestCurr = executableNetwork.CreateInferRequestPtr();
+        std::cout << "Reshape needed" << std::endl;
     }
-    InferenceEngine::Blob::Ptr input = request.GetBlob(network.getInputsInfo().begin()->first);
+}
+
+void HumanPoseEstimator::frameToBlobCurr(const cv::Mat& image) {
+    CV_Assert(image.type() == CV_8UC3);
+    InferenceEngine::Blob::Ptr input = requestCurr->GetBlob(network.getInputsInfo().begin()->first);
+    auto buffer = input->buffer().as<InferenceEngine::PrecisionTrait<InferenceEngine::Precision::U8>::value_type *>();
+    preprocess(image, buffer);
+}
+
+void HumanPoseEstimator::frameToBlobNext(const cv::Mat& image) {
+    CV_Assert(image.type() == CV_8UC3);
+    InferenceEngine::Blob::Ptr input = requestNext->GetBlob(network.getInputsInfo().begin()->first);
     auto buffer = input->buffer().as<InferenceEngine::PrecisionTrait<InferenceEngine::Precision::U8>::value_type *>();
     preprocess(image, buffer);
+}
+
+void HumanPoseEstimator::startCurr() {
+    requestCurr->StartAsync();
+}
+
+void HumanPoseEstimator::startNext() {
+    requestNext->StartAsync();
+}
 
-    request.Infer();
+bool HumanPoseEstimator::readyCurr() {
+    if (InferenceEngine::OK == requestCurr->Wait(InferenceEngine::IInferRequest::WaitMode::RESULT_READY)) {
+        return true;
+    } else {
+        return false;
+    }
+}
+
+void HumanPoseEstimator::swapRequest() {
+    requestCurr.swap(requestNext);
+}
 
-    InferenceEngine::Blob::Ptr pafsBlob = request.GetBlob(pafsBlobName);
-    InferenceEngine::Blob::Ptr heatMapsBlob = request.GetBlob(heatmapsBlobName);
-    CV_Assert(heatMapsBlob->getTensorDesc().getDims()[1] == keypointsNumber + 1);
-    InferenceEngine::SizeVector heatMapDims =
-            heatMapsBlob->getTensorDesc().getDims();
+std::vector<HumanPose> HumanPoseEstimator::postprocessCurr() {
+    InferenceEngine::Blob::Ptr pafsBlob = requestCurr->GetBlob(pafsBlobName);
+    InferenceEngine::Blob::Ptr heatMapsBlob = requestCurr->GetBlob(heatmapsBlobName);
+    InferenceEngine::SizeVector heatMapDims = heatMapsBlob->getTensorDesc().getDims();
     std::vector<HumanPose> poses = postprocess(
             heatMapsBlob->buffer(),
             heatMapDims[2] * heatMapDims[3],
@@ -101,8 +177,7 @@ void HumanPoseEstimator::preprocess(const cv::Mat& image, uint8_t* buffer) const
                        cv::BORDER_CONSTANT, meanPixel);
     std::vector<cv::Mat> planes(3);
     for (size_t pId = 0; pId < planes.size(); pId++) {
-        planes[pId] = cv::Mat(inputLayerSize, CV_8UC1,
-                              buffer + pId * inputLayerSize.area());
+        planes[pId] = cv::Mat(inputLayerSize, CV_8UC1, buffer + pId * inputLayerSize.area());
     }
     cv::split(paddedImage, planes);
 }
@@ -233,7 +308,7 @@ HumanPoseEstimator::~HumanPoseEstimator() {
     try {
         if (enablePerformanceReport) {
             std::cout << "Performance counts for " << modelPath << std::endl << std::endl;
-            printPerformanceCounts(request, std::cout, getFullDeviceName(ie, targetDeviceName), false);
+            printPerformanceCounts(*requestCurr, std::cout, getFullDeviceName(ie, targetDeviceName), false);
         }
     }
     catch (...) {
diff --git a/demos/human_pose_estimation_demo/src/peak.cpp b/demos/human_pose_estimation_demo/src/peak.cpp
index a9bb1cb9eb7..26602293ff2 100644
--- a/demos/human_pose_estimation_demo/src/peak.cpp
+++ b/demos/human_pose_estimation_demo/src/peak.cpp
@@ -6,6 +6,8 @@
 #include <utility>
 #include <vector>
 
+#include <samples/common.hpp>
+
 #include "peak.hpp"
 
 namespace human_pose_estimation {
@@ -112,11 +114,11 @@ std::vector<HumanPose> groupPeaksToPoses(const std::vector<std::vector<Peak> >&
                                          const float foundMidPointsRatioThreshold,
                                          const int minJointsNumber,
                                          const float minSubsetScore) {
-    const std::vector<std::pair<int, int> > limbIdsHeatmap = {
+    static const std::pair<int, int> limbIdsHeatmap[] = {
         {2, 3}, {2, 6}, {3, 4}, {4, 5}, {6, 7}, {7, 8}, {2, 9}, {9, 10}, {10, 11}, {2, 12}, {12, 13}, {13, 14},
         {2, 1}, {1, 15}, {15, 17}, {1, 16}, {16, 18}, {3, 17}, {6, 18}
     };
-    const std::vector<std::pair<int, int> > limbIdsPaf = {
+    static const std::pair<int, int> limbIdsPaf[] = {
         {31, 32}, {39, 40}, {33, 34}, {35, 36}, {41, 42}, {43, 44}, {19, 20}, {21, 22}, {23, 24}, {25, 26},
         {27, 28}, {29, 30}, {47, 48}, {49, 50}, {53, 54}, {51, 52}, {55, 56}, {37, 38}, {45, 46}
     };
@@ -126,7 +128,7 @@ std::vector<HumanPose> groupPeaksToPoses(const std::vector<std::vector<Peak> >&
          candidates.insert(candidates.end(), peaks.begin(), peaks.end());
     }
     std::vector<HumanPoseByPeaksIndices> subset(0, HumanPoseByPeaksIndices(keypointsNumber));
-    for (size_t k = 0; k < limbIdsPaf.size(); k++) {
+    for (size_t k = 0; k < arraySize(limbIdsPaf); k++) {
         std::vector<TwoJointsConnection> connections;
         const int mapIdxOffset = keypointsNumber + 1;
         std::pair<cv::Mat, cv::Mat> scoreMid = { pafs[limbIdsPaf[k].first - mapIdxOffset],
diff --git a/demos/human_pose_estimation_demo/src/render_human_pose.cpp b/demos/human_pose_estimation_demo/src/render_human_pose.cpp
index a2a45a479ce..7e29222a0e2 100644
--- a/demos/human_pose_estimation_demo/src/render_human_pose.cpp
+++ b/demos/human_pose_estimation_demo/src/render_human_pose.cpp
@@ -14,7 +14,7 @@ namespace human_pose_estimation {
 void renderHumanPose(const std::vector<HumanPose>& poses, cv::Mat& image) {
     CV_Assert(image.type() == CV_8UC3);
 
-    const std::vector<cv::Scalar> colors = {
+    static const cv::Scalar colors[HumanPoseEstimator::keypointsNumber] = {
         cv::Scalar(255, 0, 0), cv::Scalar(255, 85, 0), cv::Scalar(255, 170, 0),
         cv::Scalar(255, 255, 0), cv::Scalar(170, 255, 0), cv::Scalar(85, 255, 0),
         cv::Scalar(0, 255, 0), cv::Scalar(0, 255, 85), cv::Scalar(0, 255, 170),
@@ -22,7 +22,7 @@ void renderHumanPose(const std::vector<HumanPose>& poses, cv::Mat& image) {
         cv::Scalar(0, 0, 255), cv::Scalar(85, 0, 255), cv::Scalar(170, 0, 255),
         cv::Scalar(255, 0, 255), cv::Scalar(255, 0, 170), cv::Scalar(255, 0, 85)
     };
-    const std::vector<std::pair<int, int> > limbKeypointsIds = {
+    static const std::pair<int, int> limbKeypointsIds[] = {
         {1, 2},  {1, 5},   {2, 3},
         {3, 4},  {5, 6},   {6, 7},
         {1, 8},  {8, 9},   {9, 10},
diff --git a/demos/interactive_face_detection_demo/CMakeLists.txt b/demos/interactive_face_detection_demo/CMakeLists.txt
index 55fc53c60cd..6dc75b6e9e7 100644
--- a/demos/interactive_face_detection_demo/CMakeLists.txt
+++ b/demos/interactive_face_detection_demo/CMakeLists.txt
@@ -8,4 +8,5 @@ file (GLOB MAIN_HEADERS ${CMAKE_CURRENT_SOURCE_DIR}/*.h*)
 ie_add_sample(NAME interactive_face_detection_demo
               SOURCES ${MAIN_SRC}
               HEADERS ${MAIN_HEADERS}
+              DEPENDENCIES monitors
               OPENCV_DEPENDENCIES highgui)
diff --git a/demos/interactive_face_detection_demo/README.md b/demos/interactive_face_detection_demo/README.md
index 055be3a04f6..a9fbb4a97c8 100644
--- a/demos/interactive_face_detection_demo/README.md
+++ b/demos/interactive_face_detection_demo/README.md
@@ -37,7 +37,7 @@ The new Async API operates with a new notion of the Infer Request that encapsula
 
 Running the application with the `-h` option yields the following usage message:
 
-```sh
+```
 ./interactive_face_detection_demo -h
 InferenceEngine:
     API version ............ <version>
@@ -83,6 +83,7 @@ Options:
     -loop_video                Optional. Enable playing video on a loop
     -no_smooth                 Optional. Do not smooth person attributes
     -no_show_emotion_bar       Optional. Do not show emotion bar
+    -u                         Optional. List of monitors to show initially.
 ```
 
 Running the application with an empty list of options yields the usage message given above and an error message.
diff --git a/demos/interactive_face_detection_demo/detectors.cpp b/demos/interactive_face_detection_demo/detectors.cpp
index b2135483c6e..e26bd3d6c6b 100644
--- a/demos/interactive_face_detection_demo/detectors.cpp
+++ b/demos/interactive_face_detection_demo/detectors.cpp
@@ -22,15 +22,12 @@
 #include <samples/slog.hpp>
 
 #include <ie_iextension.h>
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
 
 #include "detectors.hpp"
 
 using namespace InferenceEngine;
 
-BaseDetection::BaseDetection(std::string topoName,
+BaseDetection::BaseDetection(const std::string &topoName,
                              const std::string &pathToModel,
                              const std::string &deviceForInference,
                              int maxBatch, bool isBatchDynamic, bool isAsync,
@@ -120,17 +117,13 @@ void FaceDetection::enqueue(const cv::Mat &frame) {
     enquedFrames = 1;
 }
 
-CNNNetwork FaceDetection::read()  {
+CNNNetwork FaceDetection::read(const InferenceEngine::Core& ie)  {
     slog::info << "Loading network files for Face Detection" << slog::endl;
-    CNNNetReader netReader;
     /** Read network model **/
-    netReader.ReadNetwork(pathToModel);
+    auto network = ie.ReadNetwork(pathToModel);
     /** Set batch size to 1 **/
     slog::info << "Batch size is set to " << maxBatch << slog::endl;
-    netReader.getNetwork().setBatchSize(maxBatch);
-    /** Extract model name and load its weights **/
-    std::string binFileName = fileNameNoExt(pathToModel) + ".bin";
-    netReader.ReadWeights(binFileName);
+    network.setBatchSize(maxBatch);
     /** Read labels (if any)**/
     std::string labelFileName = fileNameNoExt(pathToModel) + ".labels";
 
@@ -143,7 +136,7 @@ CNNNetwork FaceDetection::read()  {
     /** SSD-based network should have one input and one output **/
     // ---------------------------Check inputs -------------------------------------------------------------
     slog::info << "Checking Face Detection network inputs" << slog::endl;
-    InputsDataMap inputInfo(netReader.getNetwork().getInputsInfo());
+    InputsDataMap inputInfo(network.getInputsInfo());
     if (inputInfo.size() != 1) {
         throw std::logic_error("Face Detection network should have only one input");
     }
@@ -153,14 +146,14 @@ CNNNetwork FaceDetection::read()  {
 
     // ---------------------------Check outputs ------------------------------------------------------------
     slog::info << "Checking Face Detection network outputs" << slog::endl;
-    OutputsDataMap outputInfo(netReader.getNetwork().getOutputsInfo());
+    OutputsDataMap outputInfo(network.getOutputsInfo());
     if (outputInfo.size() != 1) {
         throw std::logic_error("Face Detection network should have only one output");
     }
     DataPtr& _output = outputInfo.begin()->second;
     output = outputInfo.begin()->first;
 
-    const CNNLayerPtr outputLayer = netReader.getNetwork().getLayerByName(output.c_str());
+    const CNNLayerPtr outputLayer = network.getLayerByName(output.c_str());
     if (outputLayer->type != "DetectionOutput") {
         throw std::logic_error("Face Detection network output layer(" + outputLayer->name +
                                ") should be DetectionOutput, but was " +  outputLayer->type);
@@ -192,7 +185,7 @@ CNNNetwork FaceDetection::read()  {
 
     slog::info << "Loading Face Detection model to the "<< deviceForInference << " device" << slog::endl;
     input = inputInfo.begin()->first;
-    return netReader.getNetwork();
+    return network;
 }
 
 void FaceDetection::fetchResults() {
@@ -300,25 +293,18 @@ AgeGenderDetection::Result AgeGenderDetection::operator[] (int idx) const {
     return r;
 }
 
-CNNNetwork AgeGenderDetection::read() {
+CNNNetwork AgeGenderDetection::read(const InferenceEngine::Core& ie) {
     slog::info << "Loading network files for Age/Gender Recognition network" << slog::endl;
-    CNNNetReader netReader;
     // Read network
-    netReader.ReadNetwork(pathToModel);
-
+    auto network = ie.ReadNetwork(pathToModel);
     // Set maximum batch size to be used.
-    netReader.getNetwork().setBatchSize(maxBatch);
-    slog::info << "Batch size is set to " << netReader.getNetwork().getBatchSize() << " for Age/Gender Recognition network" << slog::endl;
-
-
-    // Extract model name and load its weights
-    std::string binFileName = fileNameNoExt(pathToModel) + ".bin";
-    netReader.ReadWeights(binFileName);
+    network.setBatchSize(maxBatch);
+    slog::info << "Batch size is set to " << network.getBatchSize() << " for Age/Gender Recognition network" << slog::endl;
 
     // ---------------------------Check inputs -------------------------------------------------------------
     // Age/Gender Recognition network should have one input and two outputs
     slog::info << "Checking Age/Gender Recognition network inputs" << slog::endl;
-    InputsDataMap inputInfo(netReader.getNetwork().getInputsInfo());
+    InputsDataMap inputInfo(network.getInputsInfo());
     if (inputInfo.size() != 1) {
         throw std::logic_error("Age/Gender Recognition network should have only one input");
     }
@@ -329,7 +315,7 @@ CNNNetwork AgeGenderDetection::read() {
 
     // ---------------------------Check outputs ------------------------------------------------------------
     slog::info << "Checking Age/Gender Recognition network outputs" << slog::endl;
-    OutputsDataMap outputInfo(netReader.getNetwork().getOutputsInfo());
+    OutputsDataMap outputInfo(network.getOutputsInfo());
     if (outputInfo.size() != 2) {
         throw std::logic_error("Age/Gender Recognition network should have two output layers");
     }
@@ -377,7 +363,7 @@ CNNNetwork AgeGenderDetection::read() {
 
     slog::info << "Loading Age/Gender Recognition model to the "<< deviceForInference << " plugin" << slog::endl;
     _enabled = true;
-    return netReader.getNetwork();
+    return network;
 }
 
 
@@ -434,21 +420,17 @@ HeadPoseDetection::Results HeadPoseDetection::operator[] (int idx) const {
     return r;
 }
 
-CNNNetwork HeadPoseDetection::read() {
+CNNNetwork HeadPoseDetection::read(const InferenceEngine::Core& ie) {
     slog::info << "Loading network files for Head Pose Estimation network" << slog::endl;
-    CNNNetReader netReader;
     // Read network model
-    netReader.ReadNetwork(pathToModel);
+    auto network = ie.ReadNetwork(pathToModel);
     // Set maximum batch size
-    netReader.getNetwork().setBatchSize(maxBatch);
-    slog::info << "Batch size is set to  " << netReader.getNetwork().getBatchSize() << " for Head Pose Estimation network" << slog::endl;
-    // Extract model name and load its weights
-    std::string binFileName = fileNameNoExt(pathToModel) + ".bin";
-    netReader.ReadWeights(binFileName);
+    network.setBatchSize(maxBatch);
+    slog::info << "Batch size is set to  " << network.getBatchSize() << " for Head Pose Estimation network" << slog::endl;
 
     // ---------------------------Check inputs -------------------------------------------------------------
     slog::info << "Checking Head Pose Estimation network inputs" << slog::endl;
-    InputsDataMap inputInfo(netReader.getNetwork().getInputsInfo());
+    InputsDataMap inputInfo(network.getInputsInfo());
     if (inputInfo.size() != 1) {
         throw std::logic_error("Head Pose Estimation network should have only one input");
     }
@@ -459,7 +441,7 @@ CNNNetwork HeadPoseDetection::read() {
 
     // ---------------------------Check outputs ------------------------------------------------------------
     slog::info << "Checking Head Pose Estimation network outputs" << slog::endl;
-    OutputsDataMap outputInfo(netReader.getNetwork().getOutputsInfo());
+    OutputsDataMap outputInfo(network.getOutputsInfo());
     if (outputInfo.size() != 3) {
         throw std::logic_error("Head Pose Estimation network should have 3 outputs");
     }
@@ -499,7 +481,7 @@ CNNNetwork HeadPoseDetection::read() {
     slog::info << "Loading Head Pose Estimation model to the "<< deviceForInference << " plugin" << slog::endl;
 
     _enabled = true;
-    return netReader.getNetwork();
+    return network;
 }
 
 EmotionsDetection::EmotionsDetection(const std::string &pathToModel,
@@ -538,8 +520,6 @@ void EmotionsDetection::enqueue(const cv::Mat &face) {
 }
 
 std::map<std::string, float> EmotionsDetection::operator[] (int idx) const {
-    // Vector of supported emotions
-    static const std::vector<std::string> emotionsVec = {"neutral", "happy", "sad", "surprise", "anger"};
     auto emotionsVecSize = emotionsVec.size();
 
     Blob::Ptr emotionsBlob = request->GetBlob(outputEmotions);
@@ -578,27 +558,19 @@ std::map<std::string, float> EmotionsDetection::operator[] (int idx) const {
     return emotions;
 }
 
-CNNNetwork EmotionsDetection::read() {
+CNNNetwork EmotionsDetection::read(const InferenceEngine::Core& ie) {
     slog::info << "Loading network files for Emotions Recognition" << slog::endl;
-    InferenceEngine::CNNNetReader netReader;
     // Read network model
-    netReader.ReadNetwork(pathToModel);
-
+    auto network = ie.ReadNetwork(pathToModel);
     // Set maximum batch size
-    netReader.getNetwork().setBatchSize(maxBatch);
-    slog::info << "Batch size is set to " << netReader.getNetwork().getBatchSize() << " for Emotions Recognition" << slog::endl;
-
-
-    // Extract model name and load its weights
-    std::string binFileName = fileNameNoExt(pathToModel) + ".bin";
-    netReader.ReadWeights(binFileName);
-
+    network.setBatchSize(maxBatch);
+    slog::info << "Batch size is set to " << network.getBatchSize() << " for Emotions Recognition" << slog::endl;
     // -----------------------------------------------------------------------------------------------------
 
     // Emotions Recognition network should have one input and one output.
     // ---------------------------Check inputs -------------------------------------------------------------
     slog::info << "Checking Emotions Recognition network inputs" << slog::endl;
-    InferenceEngine::InputsDataMap inputInfo(netReader.getNetwork().getInputsInfo());
+    InferenceEngine::InputsDataMap inputInfo(network.getInputsInfo());
     if (inputInfo.size() != 1) {
         throw std::logic_error("Emotions Recognition network should have only one input");
     }
@@ -609,7 +581,7 @@ CNNNetwork EmotionsDetection::read() {
 
     // ---------------------------Check outputs ------------------------------------------------------------
     slog::info << "Checking Emotions Recognition network outputs" << slog::endl;
-    InferenceEngine::OutputsDataMap outputInfo(netReader.getNetwork().getOutputsInfo());
+    InferenceEngine::OutputsDataMap outputInfo(network.getOutputsInfo());
     if (outputInfo.size() != 1) {
         throw std::logic_error("Emotions Recognition network should have one output layer");
     }
@@ -641,7 +613,7 @@ CNNNetwork EmotionsDetection::read() {
 
     slog::info << "Loading Emotions Recognition model to the "<< deviceForInference << " plugin" << slog::endl;
     _enabled = true;
-    return netReader.getNetwork();
+    return network;
 }
 
 
@@ -708,21 +680,17 @@ std::vector<float> FacialLandmarksDetection::operator[] (int idx) const {
     return normedLandmarks;
 }
 
-CNNNetwork FacialLandmarksDetection::read() {
+CNNNetwork FacialLandmarksDetection::read(const InferenceEngine::Core& ie) {
     slog::info << "Loading network files for Facial Landmarks Estimation" << slog::endl;
-    CNNNetReader netReader;
     // Read network model
-    netReader.ReadNetwork(pathToModel);
+    auto network = ie.ReadNetwork(pathToModel);
     // Set maximum batch size
-    netReader.getNetwork().setBatchSize(maxBatch);
-    slog::info << "Batch size is set to  " << netReader.getNetwork().getBatchSize() << " for Facial Landmarks Estimation network" << slog::endl;
-    // Extract model name and load its weights
-    std::string binFileName = fileNameNoExt(pathToModel) + ".bin";
-    netReader.ReadWeights(binFileName);
+    network.setBatchSize(maxBatch);
+    slog::info << "Batch size is set to  " << network.getBatchSize() << " for Facial Landmarks Estimation network" << slog::endl;
 
     // ---------------------------Check inputs -------------------------------------------------------------
     slog::info << "Checking Facial Landmarks Estimation network inputs" << slog::endl;
-    InputsDataMap inputInfo(netReader.getNetwork().getInputsInfo());
+    InputsDataMap inputInfo(network.getInputsInfo());
     if (inputInfo.size() != 1) {
         throw std::logic_error("Facial Landmarks Estimation network should have only one input");
     }
@@ -733,7 +701,7 @@ CNNNetwork FacialLandmarksDetection::read() {
 
     // ---------------------------Check outputs ------------------------------------------------------------
     slog::info << "Checking Facial Landmarks Estimation network outputs" << slog::endl;
-    OutputsDataMap outputInfo(netReader.getNetwork().getOutputsInfo());
+    OutputsDataMap outputInfo(network.getOutputsInfo());
     if (outputInfo.size() != 1) {
         throw std::logic_error("Facial Landmarks Estimation network should have only one output");
     }
@@ -763,7 +731,7 @@ CNNNetwork FacialLandmarksDetection::read() {
     slog::info << "Loading Facial Landmarks Estimation model to the "<< deviceForInference << " plugin" << slog::endl;
 
     _enabled = true;
-    return netReader.getNetwork();
+    return network;
 }
 
 
@@ -780,7 +748,7 @@ void Load::into(InferenceEngine::Core & ie, const std::string & deviceName, bool
             config[PluginConfigParams::KEY_DYN_BATCH_ENABLED] = PluginConfigParams::YES;
         }
 
-        detector.net = ie.LoadNetwork(detector.read(), deviceName, config);
+        detector.net = ie.LoadNetwork(detector.read(ie), deviceName, config);
     }
 }
 
diff --git a/demos/interactive_face_detection_demo/detectors.hpp b/demos/interactive_face_detection_demo/detectors.hpp
index b36639f850f..2c52a0abdf1 100644
--- a/demos/interactive_face_detection_demo/detectors.hpp
+++ b/demos/interactive_face_detection_demo/detectors.hpp
@@ -45,7 +45,7 @@ struct BaseDetection {
     mutable bool _enabled;
     const bool doRawOutputMessages;
 
-    BaseDetection(std::string topoName,
+    BaseDetection(const std::string &topoName,
                   const std::string &pathToModel,
                   const std::string &deviceForInference,
                   int maxBatch, bool isBatchDynamic, bool isAsync,
@@ -54,7 +54,7 @@ struct BaseDetection {
     virtual ~BaseDetection();
 
     InferenceEngine::ExecutableNetwork* operator ->();
-    virtual InferenceEngine::CNNNetwork read() = 0;
+    virtual InferenceEngine::CNNNetwork read(const InferenceEngine::Core& ie) = 0;
     virtual void submitRequest();
     virtual void wait();
     bool enabled() const;
@@ -90,7 +90,7 @@ struct FaceDetection : BaseDetection {
                   float bb_enlarge_coefficient, float bb_dx_coefficient,
                   float bb_dy_coefficient);
 
-    InferenceEngine::CNNNetwork read() override;
+    InferenceEngine::CNNNetwork read(const InferenceEngine::Core& ie) override;
     void submitRequest() override;
 
     void enqueue(const cv::Mat &frame);
@@ -113,7 +113,7 @@ struct AgeGenderDetection : BaseDetection {
                        int maxBatch, bool isBatchDynamic, bool isAsync,
                        bool doRawOutputMessages);
 
-    InferenceEngine::CNNNetwork read() override;
+    InferenceEngine::CNNNetwork read(const InferenceEngine::Core& ie) override;
     void submitRequest() override;
 
     void enqueue(const cv::Mat &face);
@@ -139,7 +139,7 @@ struct HeadPoseDetection : BaseDetection {
                       int maxBatch, bool isBatchDynamic, bool isAsync,
                       bool doRawOutputMessages);
 
-    InferenceEngine::CNNNetwork read() override;
+    InferenceEngine::CNNNetwork read(const InferenceEngine::Core& ie) override;
     void submitRequest() override;
 
     void enqueue(const cv::Mat &face);
@@ -156,7 +156,7 @@ struct EmotionsDetection : BaseDetection {
                       int maxBatch, bool isBatchDynamic, bool isAsync,
                       bool doRawOutputMessages);
 
-    InferenceEngine::CNNNetwork read() override;
+    InferenceEngine::CNNNetwork read(const InferenceEngine::Core& ie) override;
     void submitRequest() override;
 
     void enqueue(const cv::Mat &face);
@@ -177,7 +177,7 @@ struct FacialLandmarksDetection : BaseDetection {
                              int maxBatch, bool isBatchDynamic, bool isAsync,
                              bool doRawOutputMessages);
 
-    InferenceEngine::CNNNetwork read() override;
+    InferenceEngine::CNNNetwork read(const InferenceEngine::Core& ie) override;
     void submitRequest() override;
 
     void enqueue(const cv::Mat &face);
diff --git a/demos/interactive_face_detection_demo/interactive_face_detection.hpp b/demos/interactive_face_detection_demo/interactive_face_detection.hpp
index bae31f48a16..98d038e87e6 100644
--- a/demos/interactive_face_detection_demo/interactive_face_detection.hpp
+++ b/demos/interactive_face_detection_demo/interactive_face_detection.hpp
@@ -10,254 +10,99 @@
 #include <gflags/gflags.h>
 #include <iostream>
 
-/// @brief Message for help argument
 static const char help_message[] = "Print a usage message";
-
-/// @brief Message for images argument
 static const char input_video_message[] = "Required. Path to a video file (specify \"cam\" to work with camera).";
-
-/// @brief Message for images argument
 static const char output_video_message[] = "Optional. Path to an output video file.";
-
-/// @brief message for model argument
 static const char face_detection_model_message[] = "Required. Path to an .xml file with a trained Face Detection model.";
 static const char age_gender_model_message[] = "Optional. Path to an .xml file with a trained Age/Gender Recognition model.";
 static const char head_pose_model_message[] = "Optional. Path to an .xml file with a trained Head Pose Estimation model.";
 static const char emotions_model_message[] = "Optional. Path to an .xml file with a trained Emotions Recognition model.";
 static const char facial_landmarks_model_message[] = "Optional. Path to an .xml file with a trained Facial Landmarks Estimation model.";
-
-/// @brief Message for plugin argument
-static const char plugin_message[] = "Plugin name. For example, CPU. If this parameter is specified, " \
-"the demo will look for this plugin only.";
-
-/// @brief Message for assigning face detection calculation to device
-static const char target_device_message[] = "Optional. Target device for Face Detection network (the list of available devices is shown below). " \
-"Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for a specified device.";
-
-/// @brief Message for assigning age/gender calculation to device
-static const char target_device_message_ag[] = "Optional. Target device for Age/Gender Recognition network (the list of available devices is shown below). " \
-"Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for a specified device.";
-
-/// @brief Message for assigning head pose calculation to device
-static const char target_device_message_hp[] = "Optional. Target device for Head Pose Estimation network (the list of available devices is shown below). " \
-"Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for a specified device.";
-
-/// @brief Message for assigning emotions calculation to device
-static const char target_device_message_em[] = "Optional. Target device for Emotions Recognition network (the list of available devices is shown below). " \
-"Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for a specified device.";
-
-/// @brief Message for assigning Facial Landmarks Estimation network to device
-static const char target_device_message_lm[] = "Optional. Target device for Facial Landmarks Estimation network " \
-"(the list of available devices is shown below). Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for device specified.";
-
-/// @brief Message for the maximum number of simultaneously processed faces for Age Gender network
-static const char num_batch_ag_message[] = "Optional. Number of maximum simultaneously processed faces for Age/Gender Recognition network " \
-"(by default, it is 16)";
-
-/// @brief Message for the maximum number of simultaneously processed faces for Head Pose network
-static const char num_batch_hp_message[] = "Optional. Number of maximum simultaneously processed faces for Head Pose Estimation network " \
-"(by default, it is 16)";
-
-/// @brief Message for the maximum number of simultaneously processed faces for Emotions network
-static const char num_batch_em_message[] = "Optional. Number of maximum simultaneously processed faces for Emotions Recognition network " \
-"(by default, it is 16)";
-
-/// @brief Message for the maximum number of simultaneously processed faces for Facial Landmarks Estimation network
-static const char num_batch_lm_message[] = "Optional. Number of maximum simultaneously processed faces for Facial Landmarks Estimation network " \
-"(by default, it is 16)";
-
-/// @brief Message for dynamic batching support for AgeGender net
+static const char plugin_message[] = "Plugin name. For example, CPU. If this parameter is specified, "
+                                     "the demo will look for this plugin only.";
+static const char target_device_message[] = "Optional. Target device for Face Detection network (the list of available devices is shown below). "
+                                            "Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                            "The demo will look for a suitable plugin for a specified device.";
+static const char target_device_message_ag[] = "Optional. Target device for Age/Gender Recognition network (the list of available devices is shown below). "
+                                               "Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                               "The demo will look for a suitable plugin for a specified device.";
+static const char target_device_message_hp[] = "Optional. Target device for Head Pose Estimation network (the list of available devices is shown below). "
+                                               "Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                               "The demo will look for a suitable plugin for a specified device.";
+static const char target_device_message_em[] = "Optional. Target device for Emotions Recognition network (the list of available devices is shown below). "
+                                               "Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                               "The demo will look for a suitable plugin for a specified device.";
+static const char target_device_message_lm[] = "Optional. Target device for Facial Landmarks Estimation network "
+                                               "(the list of available devices is shown below). Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                               "The demo will look for a suitable plugin for device specified.";
+static const char num_batch_ag_message[] = "Optional. Number of maximum simultaneously processed faces for Age/Gender Recognition network "
+                                           "(by default, it is 16)";
+static const char num_batch_hp_message[] = "Optional. Number of maximum simultaneously processed faces for Head Pose Estimation network "
+                                           "(by default, it is 16)";
+static const char num_batch_em_message[] = "Optional. Number of maximum simultaneously processed faces for Emotions Recognition network "
+                                           "(by default, it is 16)";
+static const char num_batch_lm_message[] = "Optional. Number of maximum simultaneously processed faces for Facial Landmarks Estimation network "
+                                           "(by default, it is 16)";
 static const char dyn_batch_ag_message[] = "Optional. Enable dynamic batch size for Age/Gender Recognition network";
-
-/// @brief Message for dynamic batching support for HeadPose net
 static const char dyn_batch_hp_message[] = "Optional. Enable dynamic batch size for Head Pose Estimation network";
-
-/// @brief Message for dynamic batching support for Emotions net
 static const char dyn_batch_em_message[] = "Optional. Enable dynamic batch size for Emotions Recognition network";
-
-/// @brief Message for dynamic batching support for Facial Landmarks Estimation network
 static const char dyn_batch_lm_message[] = "Optional. Enable dynamic batch size for Facial Landmarks Estimation network";
-
-/// @brief Message for performance counters
 static const char performance_counter_message[] = "Optional. Enable per-layer performance report";
-
-/// @brief Message for GPU custom kernels description
-static const char custom_cldnn_message[] = "Required for GPU custom kernels. "\
-"Absolute path to an .xml file with the kernels description.";
-
-/// @brief Message for user library argument
-static const char custom_cpu_library_message[] = "Required for CPU custom layers. " \
-"Absolute path to a shared library with the kernels implementation.";
-
-/// @brief Message for probability threshold argument
+static const char custom_cldnn_message[] = "Required for GPU custom kernels. "
+                                           "Absolute path to an .xml file with the kernels description.";
+static const char custom_cpu_library_message[] = "Required for CPU custom layers. "
+                                                 "Absolute path to a shared library with the kernels implementation.";
 static const char thresh_output_message[] = "Optional. Probability threshold for detections";
-
-/// @brief Message for face enlarge coefficient argument
 static const char bb_enlarge_coef_output_message[] = "Optional. Coefficient to enlarge/reduce the size of the bounding box around the detected face";
-
-/// @brief Message raw output flag
 static const char raw_output_message[] = "Optional. Output inference results as raw values";
-
-/// @brief Message do not wait for keypress after input stream completed
 static const char no_wait_for_keypress_message[] = "Optional. Do not wait for key press in the end.";
-
-/// @brief Message do not show processed video
 static const char no_show_processed_video[] = "Optional. Do not show processed video.";
-
-/// @brief Message for asynchronous mode
 static const char async_message[] = "Optional. Enable asynchronous mode";
-
-/// @brief Message for shifting coefficient by dx for detected faces
 static const char dx_coef_output_message[] = "Optional. Coefficient to shift the bounding box around the detected face along the Ox axis";
-
-/// @brief Message for shifting coefficient by dy for detected faces
 static const char dy_coef_output_message[] = "Optional. Coefficient to shift the bounding box around the detected face along the Oy axis";
-
-/// @brief Message for fps argument
 static const char fps_output_message[] = "Optional. Maximum FPS for playing video";
-
-/// @brief Message for looping video argument
 static const char loop_video_output_message[] = "Optional. Enable playing video on a loop";
-
-/// @brief Message for smooth argument
 static const char no_smooth_output_message[] = "Optional. Do not smooth person attributes";
-
-/// @brief Message for smooth argument
 static const char no_show_emotion_bar_message[] = "Optional. Do not show emotion bar";
+static const char utilization_monitors_message[] = "Optional. List of monitors to show initially.";
 
-/// \brief Define flag for showing help message<br>
 DEFINE_bool(h, false, help_message);
-
-/// \brief Define parameter for set image file<br>
-/// It is a required parameter
 DEFINE_string(i, "", input_video_message);
-
-/// \brief Define parameter for an output video file<br>
-/// It is an optional parameter
 DEFINE_string(o, "", output_video_message);
-
-/// \brief Define parameter for Face Detection model file<br>
-/// It is a required parameter
 DEFINE_string(m, "", face_detection_model_message);
-
-/// \brief Define parameter for Age Gender Recognition model file<br>
-/// It is a optional parameter
 DEFINE_string(m_ag, "", age_gender_model_message);
-
-/// \brief Define parameter for Head Pose Estimation model file<br>
-/// It is a optional parameter
 DEFINE_string(m_hp, "", head_pose_model_message);
-
-/// \brief Define parameter for Emotions Recognition model file<br>
-/// It is a optional parameter
 DEFINE_string(m_em, "", emotions_model_message);
-
-/// \brief Define parameter for Facial Landmarks Estimation model file<br>
-/// It is an optional parameter
 DEFINE_string(m_lm, "", facial_landmarks_model_message);
-
-/// \brief target device for Face Detection network<br>
 DEFINE_string(d, "CPU", target_device_message);
-
-/// \brief Define parameter for target device for Age/Gender Recognition network<br>
 DEFINE_string(d_ag, "CPU", target_device_message_ag);
-
-/// \brief Define parameter for target device for Head Pose Estimation network<br>
 DEFINE_string(d_hp, "CPU", target_device_message_hp);
-
-/// \brief Define parameter for target device for Emotions Recognition network<br>
 DEFINE_string(d_em, "CPU", target_device_message_em);
-
-/// \brief Define parameter for target device for Facial Landmarks Estimation network<br>
 DEFINE_string(d_lm, "CPU", target_device_message_lm);
-
-/// \brief Define parameter for maximum batch size for Age/Gender Recognition network<br>
 DEFINE_uint32(n_ag, 16, num_batch_ag_message);
-
-/// \brief Define parameter to enable dynamic batch size for Age/Gender Recognition network<br>
 DEFINE_bool(dyn_ag, false, dyn_batch_ag_message);
-
-/// \brief Define parameter for maximum batch size for Head Pose Estimation network<br>
 DEFINE_uint32(n_hp, 16, num_batch_hp_message);
-
-/// \brief Define parameter to enable dynamic batch size for Head Pose Estimation network<br>
 DEFINE_bool(dyn_hp, false, dyn_batch_hp_message);
-
-/// \brief Define parameter for maximum batch size for Emotions Recognition network<br>
 DEFINE_uint32(n_em, 16, num_batch_em_message);
-
-/// \brief Define parameter to enable dynamic batch size for Emotions Recognition network<br>
 DEFINE_bool(dyn_em, false, dyn_batch_em_message);
-
-/// \brief Define parameter for maximum batch size for Facial Landmarks Estimation network<br>
 DEFINE_uint32(n_lm, 16, num_batch_em_message);
-
-/// \brief Define parameter to enable dynamic batch size for Facial Landmarks Estimation network<br>
 DEFINE_bool(dyn_lm, false, dyn_batch_em_message);
-
-/// \brief Define parameter to enable per-layer performance report<br>
 DEFINE_bool(pc, false, performance_counter_message);
-
-/// @brief Define parameter for GPU custom kernels path<br>
-/// Default is ./lib
 DEFINE_string(c, "", custom_cldnn_message);
-
-/// @brief Define parameter for absolute path to CPU library with user layers<br>
-/// It is an optional parameter
 DEFINE_string(l, "", custom_cpu_library_message);
-
-/// \brief Define a flag to output raw scoring results<br>
-/// It is an optional parameter
 DEFINE_bool(r, false, raw_output_message);
-
-/// \brief Define a parameter for probability threshold for detections<br>
-/// It is an optional parameter
 DEFINE_double(t, 0.5, thresh_output_message);
-
-/// \brief Define a parameter to enlarge the bounding box around the detected face for more robust operation of face analytics networks<br>
-/// It is an optional parameter
 DEFINE_double(bb_enlarge_coef, 1.2, bb_enlarge_coef_output_message);
-
-/// \brief Define a flag to disable keypress exit<br>
-/// It is an optional parameter
 DEFINE_bool(no_wait, false, no_wait_for_keypress_message);
-
-/// \brief Define a flag to disable showing processed video<br>
-/// It is an optional parameter
 DEFINE_bool(no_show, false, no_show_processed_video);
-
-/// \brief Define a flag to enable aynchronous execution<br>
-/// It is an optional parameter
 DEFINE_bool(async, false, async_message);
-
-/// \brief Define a parameter to shift face bounding box by Ox for more robust operation of face analytics networks<br>
-/// It is an optional parameter
 DEFINE_double(dx_coef, 1, dx_coef_output_message);
-
-/// \brief Define a parameter to shift face bounding box by Oy for more robust operation of face analytics networks<br>
-/// It is an optional parameter
 DEFINE_double(dy_coef, 1, dy_coef_output_message);
-
-/// \brief Define a parameter to play video with defined fps<br>
-/// It is an optional parameter
 DEFINE_double(fps, -1, fps_output_message);
-
-/// \brief Define a flag to loop video<br>
-/// It is an optional parameter
 DEFINE_bool(loop_video, false, loop_video_output_message);
-
-/// \brief Define a flag to disable smoothing person attributes<br>
-/// It is an optional parameter
 DEFINE_bool(no_smooth, false, no_smooth_output_message);
-
-/// \brief Define a flag to disable showing emotion bar<br>
-/// It is an optional parameter
 DEFINE_bool(no_show_emotion_bar, false, no_show_emotion_bar_message);
+DEFINE_string(u, "", utilization_monitors_message);
 
 
 /**
@@ -306,4 +151,5 @@ static void showUsage() {
     std::cout << "    -loop_video                " << loop_video_output_message << std::endl;
     std::cout << "    -no_smooth                 " << no_smooth_output_message << std::endl;
     std::cout << "    -no_show_emotion_bar       " << no_show_emotion_bar_message << std::endl;
+    std::cout << "    -u                         " << utilization_monitors_message << std::endl;
 }
diff --git a/demos/interactive_face_detection_demo/main.cpp b/demos/interactive_face_detection_demo/main.cpp
index 332a07e1bd3..e77e79fc1b9 100644
--- a/demos/interactive_face_detection_demo/main.cpp
+++ b/demos/interactive_face_detection_demo/main.cpp
@@ -25,6 +25,7 @@
 
 #include <inference_engine.hpp>
 
+#include <monitors/presenter.h>
 #include <samples/ocv_common.hpp>
 #include <samples/slog.hpp>
 
@@ -34,9 +35,6 @@
 #include "visualizer.hpp"
 
 #include <ie_iextension.h>
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
 
 using namespace InferenceEngine;
 
@@ -108,7 +106,7 @@ int main(int argc, char *argv[]) {
         Core ie;
 
         std::set<std::string> loadedDevices;
-        std::vector<std::pair<std::string, std::string>> cmdOptions = {
+        std::pair<std::string, std::string> cmdOptions[] = {
             {FLAGS_d, FLAGS_m},
             {FLAGS_d_ag, FLAGS_m_ag},
             {FLAGS_d_hp, FLAGS_m_hp},
@@ -138,9 +136,6 @@ int main(int argc, char *argv[]) {
 
             /** Loading extensions for the CPU device **/
             if ((deviceName.find("CPU") != std::string::npos)) {
-#ifdef WITH_EXTENSIONS
-                ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-#endif
 
                 if (!FLAGS_l.empty()) {
                     // CPU(MKLDNN) extensions are loaded as a shared library and passed as a pointer to base extension
@@ -180,8 +175,6 @@ int main(int argc, char *argv[]) {
 
         std::ostringstream out;
         size_t framesCounter = 0;
-        bool frameReadStatus;
-        bool isLastFrame;
         int delay = 1;
         double msrate = -1;
         cv::Mat prev_frame, next_frame;
@@ -207,18 +200,23 @@ int main(int argc, char *argv[]) {
         prev_frame = frame.clone();
 
         // Reading the next frame
-        frameReadStatus = cap.read(frame);
+        bool frameReadStatus = cap.read(frame);
 
         std::cout << "To close the application, press 'CTRL+C' here";
         if (!FLAGS_no_show) {
-            std::cout << " or switch to the output window and press any key";
+            std::cout << " or switch to the output window and press Q or Esc";
         }
         std::cout << std::endl;
 
+        const cv::Point THROUGHPUT_METRIC_POSITION{10, 45};
+
+        cv::Size graphSize{static_cast<int>(cap.get(cv::CAP_PROP_FRAME_WIDTH) / 4), 60};
+        Presenter presenter(FLAGS_u, THROUGHPUT_METRIC_POSITION.y + 15, graphSize);
+
         while (true) {
             timer.start("total");
             framesCounter++;
-            isLastFrame = !frameReadStatus;
+            bool isLastFrame = !frameReadStatus;
 
             // Retrieving face detection results for the previous frame
             faceDetector.wait();
@@ -289,7 +287,7 @@ int main(int argc, char *argv[]) {
                     float intensity_mean = calcMean(prev_frame(rect));
 
                     if ((face == nullptr) ||
-                        ((face != nullptr) && ((std::abs(intensity_mean - face->_intensity_mean) / face->_intensity_mean) > 0.07f))) {
+                        ((std::abs(intensity_mean - face->_intensity_mean) / face->_intensity_mean) > 0.07f)) {
                         face = std::make_shared<Face>(id++, rect);
                     } else {
                         prev_faces.remove(face);
@@ -330,12 +328,14 @@ int main(int argc, char *argv[]) {
                 faces.push_back(face);
             }
 
+            presenter.drawGraphs(prev_frame);
+
             //  Visualizing results
             if (!FLAGS_no_show || !FLAGS_o.empty()) {
                 out.str("");
                 out << "Total image throughput: " << std::fixed << std::setprecision(2)
                     << 1000.f / (timer["total"].getSmoothedDuration()) << " fps";
-                cv::putText(prev_frame, out.str(), cv::Point2f(10, 45), cv::FONT_HERSHEY_TRIPLEX, 1.2,
+                cv::putText(prev_frame, out.str(), THROUGHPUT_METRIC_POSITION, cv::FONT_HERSHEY_TRIPLEX, 1,
                             cv::Scalar(255, 0, 0), 2);
 
                 // drawing faces
@@ -367,8 +367,12 @@ int main(int argc, char *argv[]) {
                     cv::waitKey(0);
                 }
                 break;
-            } else if (!FLAGS_no_show && -1 != cv::waitKey(delay)) {
-                break;
+            } else if (!FLAGS_no_show) {
+                int key = cv::waitKey(delay);
+                if (27 == key || 'Q' == key || 'q' == key) {
+                    break;
+                }
+                presenter.handleKey(key);
             }
         }
 
@@ -383,6 +387,8 @@ int main(int argc, char *argv[]) {
             emotionsDetector.printPerformanceCounts(getFullDeviceName(ie, FLAGS_d_em));
             facialLandmarksDetector.printPerformanceCounts(getFullDeviceName(ie, FLAGS_d_lm));
         }
+
+        std::cout << presenter.reportMeans() << '\n';
         // ---------------------------------------------------------------------------------------------------
 
         if (!FLAGS_o.empty()) {
diff --git a/demos/mask_rcnn_demo/CMakeLists.txt b/demos/mask_rcnn_demo/CMakeLists.txt
index 872e3c4f363..2d8cb775ce1 100644
--- a/demos/mask_rcnn_demo/CMakeLists.txt
+++ b/demos/mask_rcnn_demo/CMakeLists.txt
@@ -5,5 +5,4 @@
 ie_add_sample(NAME mask_rcnn_demo
               SOURCES "${CMAKE_CURRENT_SOURCE_DIR}/main.cpp"
               HEADERS "${CMAKE_CURRENT_SOURCE_DIR}/mask_rcnn_demo.h"
-              DEPENDENCIES format_reader
               OPENCV_DEPENDENCIES imgcodecs)
diff --git a/demos/mask_rcnn_demo/README.md b/demos/mask_rcnn_demo/README.md
index e43fa4f1ec9..b8cdcfa88a2 100644
--- a/demos/mask_rcnn_demo/README.md
+++ b/demos/mask_rcnn_demo/README.md
@@ -13,7 +13,7 @@ Upon the start-up, the demo application reads command line parameters and loads
 ## Running
 
 Running the application with the `-h` option yields the following usage message:
-```sh
+```
 ./mask_rcnn_demo -h
 InferenceEngine:
     API version ............ <version>
@@ -23,13 +23,13 @@ mask_rcnn_demo [OPTION]
 Options:
 
     -h                                Print a usage message.
-    -i "<path>"                       Required. Path to an .bmp image.
+    -i "<path>"                       Required. Path to a .bmp image.
     -m "<path>"                       Required. Path to an .xml file with a trained model.
       -l "<absolute_path>"            Required for CPU custom layers. Absolute path to a shared library with the kernels implementations.
           Or
       -c "<absolute_path>"            Required for GPU custom kernels. Absolute path to the .xml file with the kernels descriptions.
-    -d "<device>"                     Optional. Specify the target device to infer on (the list of available devices is shown below). Use "-d HETERO:<comma-separated_devices_list>" format to specify HETERO plugin. The demo will look for a suitable plugin for a specified device (CPU by default).
-    -detection_output_name "<string>" Optional. The name of detection output layer. Default value is "detection_output"
+    -d "<device>"                     Optional. Specify the target device to infer on (the list of available devices is shown below). Use "-d HETERO:<comma-separated_devices_list>" format to specify HETERO plugin. The demo will look for a suitable plugin for a specified device (CPU by default)
+    -detection_output_name "<string>" Optional. The name of detection output layer. Default value is "reshape_do_2d"
     -masks_name "<string>"            Optional. The name of masks layer. Default value is "masks"
 ```
 
@@ -41,7 +41,7 @@ To run the demo, you can use public or pre-trained models. To download the pre-t
 
 You can use the following command to do inference on CPU on an image using a trained network:
 ```sh
-./mask_rcnn_demo -i <path_to_image>/inputImage.bmp -m <path_to_model>/faster_rcnn.xml
+./mask_rcnn_demo -i <path_to_image>/inputImage.bmp -m <path_to_model>/mask_rcnn_inception_resnet_v2_atrous_coco.xml
 ```
 
 ## Demo Output
diff --git a/demos/mask_rcnn_demo/main.cpp b/demos/mask_rcnn_demo/main.cpp
index 35728359ea6..ea1abc4c96a 100644
--- a/demos/mask_rcnn_demo/main.cpp
+++ b/demos/mask_rcnn_demo/main.cpp
@@ -17,11 +17,6 @@
 #include <iomanip>
 
 #include <inference_engine.hpp>
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
-
-#include <format_reader_ptr.h>
 
 #include <samples/ocv_common.hpp>
 #include <samples/slog.hpp>
@@ -63,27 +58,15 @@ int main(int argc, char *argv[]) {
         }
 
         /** This vector stores paths to the processed images **/
-        std::vector<std::string> images;
-        parseInputFilesArguments(images);
-        if (images.empty()) throw std::logic_error("No suitable images were found");
+        std::vector<std::string> imagePaths;
+        parseInputFilesArguments(imagePaths);
+        if (imagePaths.empty()) throw std::logic_error("No suitable images were found");
         // -----------------------------------------------------------------------------------------------------
 
         // ---------------------Load inference engine------------------------------------------------
         slog::info << "Loading Inference Engine" << slog::endl;
         Core ie;
 
-#ifdef WITH_EXTENSIONS
-        /** Loading default extensions **/
-        if (FLAGS_d.find("CPU") != std::string::npos) {
-            /**
-             * cpu_extensions library is compiled from "extension" folder containing
-             * custom MKLDNNPlugin layer implementations. These layers are not supported
-             * by mkldnn, but they can be useful for inferring custom topologies.
-            **/
-            ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-        }
-#endif
-
         if (!FLAGS_l.empty()) {
             // CPU(MKLDNN) extensions are loaded as a shared library and passed as a pointer to base extension
             auto extension_ptr = make_so_pointer<InferenceEngine::IExtension>(FLAGS_l);
@@ -105,14 +88,8 @@ int main(int argc, char *argv[]) {
         // --------------------Load network (Generated xml/bin files)-------------------------------------------
         slog::info << "Loading network files" << slog::endl;
 
-        InferenceEngine::CNNNetReader networkReader;
         /** Read network model **/
-        networkReader.ReadNetwork(FLAGS_m);
-
-        /** Extract model name and load weights **/
-        std::string binFileName = fileNameNoExt(FLAGS_m) + ".bin";
-        networkReader.ReadWeights(binFileName);
-        auto network = networkReader.getNetwork();
+        auto network = ie.ReadNetwork(FLAGS_m);
 
         // add DetectionOutput layer as output so we can get detected boxes and their probabilities
         network.addOutput(FLAGS_detection_output_name.c_str(), 0);
@@ -141,44 +118,38 @@ int main(int argc, char *argv[]) {
         const TensorDesc& inputDesc = inputInfo[imageInputName]->getTensorDesc();
         IE_ASSERT(inputDesc.getDims().size() == 4);
         size_t netBatchSize = getTensorBatch(inputDesc);
-        size_t netInputChannels = getTensorChannels(inputDesc);
         size_t netInputHeight = getTensorHeight(inputDesc);
         size_t netInputWidth = getTensorWidth(inputDesc);
 
         slog::info << "Network batch size is " << netBatchSize << slog::endl;
 
-        /** Collect images data ptrs **/
-        std::vector<std::shared_ptr<unsigned char>> imagesData;
-        std::vector<cv::Mat> images_cv;
+        /** Collect images **/
+        std::vector<cv::Mat> images;
 
-        if (netBatchSize > images.size()) {
-            slog::warn << "Network batch size is greater than number of images (" << images.size() <<
+        if (netBatchSize > imagePaths.size()) {
+            slog::warn << "Network batch size is greater than number of images (" << imagePaths.size() <<
                        "), some input files will be duplicated" << slog::endl;
-        } else if (netBatchSize < images.size()) {
-            slog::warn << "Network batch size is less than number of images (" << images.size() <<
+        } else if (netBatchSize < imagePaths.size()) {
+            slog::warn << "Network batch size is less than number of images (" << imagePaths.size() <<
                        "), some input files will be ignored" << slog::endl;
         }
 
         for (size_t i = 0, inputIndex = 0; i < netBatchSize; i++, inputIndex++) {
-            if (inputIndex >= images.size()) {
+            if (inputIndex >= imagePaths.size()) {
                 inputIndex = 0;
             }
-            slog::info << "Prepare image " << images[inputIndex] << slog::endl;
+            slog::info << "Prepare image " << imagePaths[inputIndex] << slog::endl;
 
-            images_cv.push_back(cv::imread(images[inputIndex], cv::IMREAD_COLOR));
+            cv::Mat image = cv::imread(imagePaths[inputIndex], cv::IMREAD_COLOR);
 
-            FormatReader::ReaderPtr reader(images[inputIndex].c_str());
-            if (reader.get() == nullptr) {
-                slog::warn << "Image " + images[inputIndex] + " cannot be read!" << slog::endl;
+            if (image.empty()) {
+                slog::warn << "Image " + imagePaths[inputIndex] + " cannot be read!" << slog::endl;
                 continue;
             }
-            /** Getting image data **/
-            std::shared_ptr<unsigned char> data(reader->getData(netInputWidth, netInputHeight));
-            if (data != nullptr) {
-                imagesData.push_back(data);
-            }
+
+            images.push_back(image);
         }
-        if (imagesData.empty()) throw std::logic_error("Valid input images were not found!");
+        if (images.empty()) throw std::logic_error("Valid input images were not found!");
 
         // -----------------------------------------------------------------------------------------------------
 
@@ -211,21 +182,9 @@ int main(int argc, char *argv[]) {
 
             /** Fill first input tensor with images. First b channel, then g and r channels **/
             if (inputInfoItem.second->getTensorDesc().getDims().size() == 4) {
-                auto data = input->buffer().as<PrecisionTrait<Precision::U8>::value_type *>();
-                size_t image_size = netInputHeight * netInputWidth;
-
                 /** Iterate over all input images **/
-                for (size_t image_id = 0; image_id < imagesData.size(); ++image_id) {
-                    /** Iterate over all pixels in image (b,g,r) **/
-                    for (size_t pid = 0; pid < image_size; pid++) {
-                        /** Iterate over all channels **/
-                        for (size_t ch = 0; ch < netInputChannels; ++ch) {
-                            /**          [images stride + channels stride + pixel id ] all in bytes            **/
-                            data[image_id * image_size * netInputChannels + ch * image_size + pid] = imagesData.at(
-                                    image_id).get()[pid * netInputChannels + ch];
-                        }
-                    }
-                }
+                for (size_t image_id = 0; image_id < images.size(); ++image_id)
+                    matU8ToBlob<unsigned char>(images[image_id], input, image_id);
             }
 
             /** Fill second input tensor with image info **/
@@ -257,7 +216,7 @@ int main(int argc, char *argv[]) {
         const float PROBABILITY_THRESHOLD = 0.2f;
         const float MASK_THRESHOLD = 0.5f;  // threshold used to determine whether mask pixel corresponds to object or to background
         // amount of elements in each detected box description (batch, label, prob, x1, y1, x2, y2)
-        IE_ASSERT(do_blob->getTensorDesc().getDims().size() == 4);
+        IE_ASSERT(do_blob->getTensorDesc().getDims().size() == 2);
         size_t BOX_DESCRIPTION_SIZE = do_blob->getTensorDesc().getDims().back();
 
         const TensorDesc& masksDesc = masks_blob->getTensorDesc();
@@ -270,34 +229,10 @@ int main(int argc, char *argv[]) {
 
         size_t box_stride = W * H * C;
 
-        // some colours
-        std::vector<std::vector<short>> colors = {
-            {128, 64,  128},
-            {232, 35,  244},
-            {70,  70,  70},
-            {156, 102, 102},
-            {153, 153, 190},
-            {153, 153, 153},
-            {30,  170, 250},
-            {0,   220, 220},
-            {35,  142, 107},
-            {152, 251, 152},
-            {180, 130, 70},
-            {60,  20,  220},
-            {0,   0,   255},
-            {142, 0,   0},
-            {70,  0,   0},
-            {100, 60,  0},
-            {90,  0,   0},
-            {230, 0,   0},
-            {32,  11,  119},
-            {0,   74,  111},
-            {81,  0,   81}
-        };
         std::map<size_t, size_t> class_color;
 
         std::vector<cv::Mat> output_images;
-        for (const auto &img : images_cv) {
+        for (const auto &img : images) {
             output_images.push_back(img.clone());
         }
 
@@ -310,17 +245,16 @@ int main(int argc, char *argv[]) {
             if (batch >= static_cast<int>(netBatchSize))
                 throw std::logic_error("Invalid batch ID within detection output box");
             float prob = box_info[2];
-            float x1 = std::min(std::max(0.0f, box_info[3] * images_cv[batch].size().width), static_cast<float>(images_cv[batch].size().width));
-            float y1 = std::min(std::max(0.0f, box_info[4] * images_cv[batch].size().height), static_cast<float>(images_cv[batch].size().height));
-            float x2 = std::min(std::max(0.0f, box_info[5] * images_cv[batch].size().width), static_cast<float>(images_cv[batch].size().width));
-            float y2 = std::min(std::max(0.0f, box_info[6] * images_cv[batch].size().height), static_cast<float>(images_cv[batch].size().height));
-            int box_width = std::min(static_cast<int>(std::max(0.0f, x2 - x1)), images_cv[batch].size().width);
-            int box_height = std::min(static_cast<int>(std::max(0.0f, y2 - y1)), images_cv[batch].size().height);
+            float x1 = std::min(std::max(0.0f, box_info[3] * images[batch].cols), static_cast<float>(images[batch].cols));
+            float y1 = std::min(std::max(0.0f, box_info[4] * images[batch].rows), static_cast<float>(images[batch].rows));
+            float x2 = std::min(std::max(0.0f, box_info[5] * images[batch].cols), static_cast<float>(images[batch].cols));
+            float y2 = std::min(std::max(0.0f, box_info[6] * images[batch].rows), static_cast<float>(images[batch].rows));
+            int box_width = std::min(static_cast<int>(std::max(0.0f, x2 - x1)), images[batch].cols);
+            int box_height = std::min(static_cast<int>(std::max(0.0f, y2 - y1)), images[batch].rows);
             auto class_id = static_cast<size_t>(box_info[1] + 1e-6f);
             if (prob > PROBABILITY_THRESHOLD) {
-                if (class_color.find(class_id) == class_color.end())
-                    class_color[class_id] = class_color.size();
-                auto& color = colors[class_color[class_id]];
+                size_t color_index = class_color.emplace(class_id, class_color.size()).first->second;
+                auto& color = CITYSCAPES_COLORS[color_index % arraySize(CITYSCAPES_COLORS)];
                 float* mask_arr = masks_data + box_stride * box + H * W * (class_id - 1);
                 slog::info << "Detected class " << class_id << " with probability " << prob << " from batch " << batch
                            << ": [" << x1 << ", " << y1 << "], [" << x2 << ", " << y2 << "]" << slog::endl;
@@ -333,13 +267,9 @@ int main(int argc, char *argv[]) {
                 cv::Mat resized_mask_mat(box_height, box_width, CV_32FC1);
                 cv::resize(mask_mat, resized_mask_mat, cv::Size(box_width, box_height));
 
-                cv::Mat uchar_resized_mask(box_height, box_width, images_cv[batch].type());
-
-                for (int h = 0; h < resized_mask_mat.size().height; ++h)
-                    for (int w = 0; w < resized_mask_mat.size().width; ++w)
-                        for (int ch = 0; ch < uchar_resized_mask.channels(); ++ch)
-                            uchar_resized_mask.at<cv::Vec3b>(h, w)[ch] = resized_mask_mat.at<float>(h, w) > MASK_THRESHOLD ?
-                                                                            255 * color[ch]: roi_input_img.at<cv::Vec3b>(h, w)[ch];
+                cv::Mat uchar_resized_mask(box_height, box_width, CV_8UC3,
+                    cv::Scalar(color.blue(), color.green(), color.red()));
+                roi_input_img.copyTo(uchar_resized_mask, resized_mask_mat <= MASK_THRESHOLD);
 
                 cv::addWeighted(uchar_resized_mask, alpha, roi_input_img, 1.0f - alpha, 0.0f, roi_input_img);
                 cv::rectangle(output_images[batch], roi, cv::Scalar(0, 0, 1), 1);
diff --git a/demos/mask_rcnn_demo/mask_rcnn_demo.h b/demos/mask_rcnn_demo/mask_rcnn_demo.h
index af05f0c536b..5a30909e649 100644
--- a/demos/mask_rcnn_demo/mask_rcnn_demo.h
+++ b/demos/mask_rcnn_demo/mask_rcnn_demo.h
@@ -9,60 +9,26 @@
 #include <gflags/gflags.h>
 #include <iostream>
 
-/// @brief message for help argument
 static const char help_message[] = "Print a usage message.";
-
-/// @brief message for images argument
-static const char image_message[] = "Required. Path to an .bmp image.";
-
-/// @brief message for model argument
-static const char model_message[] = "Required. Path to an .xml file with a trained model.";\
-
-/// @brief message for assigning cnn calculation to device
-static const char target_device_message[] = "Optional. Specify the target device to infer on (the list of available devices is shown below). " \
-"Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for a specified device (CPU by default)";
-
-/// @brief message for clDNN custom kernels desc
-static const char custom_cldnn_message[] = "Required for GPU custom kernels. "\
-"Absolute path to the .xml file with the kernels descriptions.";
-
-/// @brief message for user library argument
-static const char custom_cpu_library_message[] = "Required for CPU custom layers. " \
-"Absolute path to a shared library with the kernels implementations.";
-
-/// @brief message for detection output layer name argument
-static const char detection_output_layer_name_message[] = "Optional. The name of detection output layer. Default value is \"detection_output\"";
-
-/// @brief message for masks layer name argument
+static const char image_message[] = "Required. Path to a .bmp image.";
+static const char model_message[] = "Required. Path to an .xml file with a trained model.";
+static const char target_device_message[] = "Optional. Specify the target device to infer on (the list of available devices is shown below). "
+                                            "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                            "The demo will look for a suitable plugin for a specified device (CPU by default)";
+static const char custom_cldnn_message[] = "Required for GPU custom kernels. "
+                                           "Absolute path to the .xml file with the kernels descriptions.";
+static const char custom_cpu_library_message[] = "Required for CPU custom layers. "
+                                                 "Absolute path to a shared library with the kernels implementations.";
+static const char detection_output_layer_name_message[] = "Optional. The name of detection output layer. Default value is \"reshape_do_2d\"";
 static const char masks_layer_name_message[] = "Optional. The name of masks layer. Default value is \"masks\"";
 
-/// @brief Define parameter for clDNN custom kernels path <br>
-/// Default is ./lib
 DEFINE_string(c, "", custom_cldnn_message);
-
-/// @brief Absolute path to CPU library with user layers <br>
-/// It is a optional parameter
 DEFINE_string(l, "", custom_cpu_library_message);
-
-/// @brief Define flag for showing help message <br>
 DEFINE_bool(h, false, help_message);
-
-/// @brief Define parameter for set image file <br>
-/// It is a required parameter
 DEFINE_string(i, "", image_message);
-
-/// @brief Define parameter for set model file <br>
-/// It is a required parameter
 DEFINE_string(m, "", model_message);
-
-/// @brief device the target device to infer on <br>
 DEFINE_string(d, "CPU", target_device_message);
-
-/// @brief Custom Detection Output layer name
-DEFINE_string(detection_output_name, "detection_output", detection_output_layer_name_message);
-
-/// @brief Custom layer name producing masks
+DEFINE_string(detection_output_name, "reshape_do_2d", detection_output_layer_name_message);
 DEFINE_string(masks_name, "masks", masks_layer_name_message);
 
 /**
diff --git a/demos/mask_rcnn_demo/models.lst b/demos/mask_rcnn_demo/models.lst
new file mode 100644
index 00000000000..1ffb9148c4f
--- /dev/null
+++ b/demos/mask_rcnn_demo/models.lst
@@ -0,0 +1,5 @@
+# This file can be used with the --list option of the model downloader.
+mask_rcnn_inception_resnet_v2_atrous_coco
+mask_rcnn_inception_v2_coco
+mask_rcnn_resnet101_atrous_coco
+mask_rcnn_resnet50_atrous_coco
diff --git a/demos/multichannel_demo/CMakeLists.txt b/demos/multi_channel/CMakeLists.txt
similarity index 87%
rename from demos/multichannel_demo/CMakeLists.txt
rename to demos/multi_channel/CMakeLists.txt
index ff575b7784f..5e00db8ae1e 100644
--- a/demos/multichannel_demo/CMakeLists.txt
+++ b/demos/multi_channel/CMakeLists.txt
@@ -21,5 +21,6 @@ if(MULTICHANNEL_DEMO_USE_NATIVE_CAM)
 endif()
 
 add_subdirectory(common)
-add_subdirectory(fd)
-add_subdirectory(hpe)
+add_subdirectory(face_detection_demo)
+add_subdirectory(human_pose_estimation_demo)
+add_subdirectory(object_detection_demo_yolov3)
diff --git a/demos/multi_channel/README.md b/demos/multi_channel/README.md
new file mode 100644
index 00000000000..3876b9d5a6a
--- /dev/null
+++ b/demos/multi_channel/README.md
@@ -0,0 +1,6 @@
+# Multi-Channel C++ Demos
+
+The demos provide an inference pipeline for three multi-channel scenarios: face detection, human pose estimation, and object detection with YOLOv3. For more information, refer to the corresponding pages:
+* [Multi-Channel Face Detection C++ Demo](./face_detection_demo/README.md)
+* [Multi-Channel Human Pose Estimation C++ Demo](./human_pose_estimation_demo/README.md)
+* [Multi-Channel Object Detection Yolov3 C++ Demo](./object_detection_demo_yolov3/README.md)
diff --git a/demos/multichannel_demo/common/CMakeLists.txt b/demos/multi_channel/common/CMakeLists.txt
similarity index 95%
rename from demos/multichannel_demo/common/CMakeLists.txt
rename to demos/multi_channel/common/CMakeLists.txt
index 740f3e1ec46..d5e5d933e40 100644
--- a/demos/multichannel_demo/common/CMakeLists.txt
+++ b/demos/multi_channel/common/CMakeLists.txt
@@ -110,13 +110,7 @@ endif()
 
 target_include_directories(${TARGET_NAME} PUBLIC "${CMAKE_CURRENT_SOURCE_DIR}")
 
-if(TARGET IE::ie_cpu_extension)
-    add_definitions(-DWITH_EXTENSIONS)
-endif()
 target_link_libraries(${TARGET_NAME} ${InferenceEngine_LIBRARIES} gflags ${OpenCV_LIBRARIES})
-if(TARGET IE::ie_cpu_extension)
-    target_link_libraries(${TARGET_NAME} IE::ie_cpu_extension)
-endif()
 
 if(UNIX)
     target_link_libraries( ${TARGET_NAME} pthread)
diff --git a/demos/multichannel_demo/common/decoder.cpp b/demos/multi_channel/common/decoder.cpp
similarity index 100%
rename from demos/multichannel_demo/common/decoder.cpp
rename to demos/multi_channel/common/decoder.cpp
diff --git a/demos/multichannel_demo/common/decoder.hpp b/demos/multi_channel/common/decoder.hpp
similarity index 98%
rename from demos/multichannel_demo/common/decoder.hpp
rename to demos/multi_channel/common/decoder.hpp
index af58f7e6b7f..feb7a9e81de 100644
--- a/demos/multichannel_demo/common/decoder.hpp
+++ b/demos/multi_channel/common/decoder.hpp
@@ -34,6 +34,7 @@ class Decoder final {
 
     explicit Decoder(const Settings& s);
     Decoder(const Decoder&) = delete;
+    Decoder& operator =(const Decoder&) = delete;
     ~Decoder();
 
     struct Stats {
diff --git a/demos/multichannel_demo/common/graph.cpp b/demos/multi_channel/common/graph.cpp
similarity index 90%
rename from demos/multichannel_demo/common/graph.cpp
rename to demos/multi_channel/common/graph.cpp
index 5756f04cbd3..3e50233c396 100644
--- a/demos/multichannel_demo/common/graph.cpp
+++ b/demos/multi_channel/common/graph.cpp
@@ -38,19 +38,9 @@ void loadImgToIEGraph(const cv::Mat& img, size_t batch, void* ieBuffer) {
 }  // namespace
 
 void IEGraph::initNetwork(const std::string& deviceName) {
-    InferenceEngine::CNNNetReader  netReader;
-
-    netReader.ReadNetwork(modelPath);
-    netReader.ReadWeights(weightsPath);
-
-    if (!netReader.isParseSuccess()) {
-        throw std::logic_error("Failed to parse model!");
-    }
+    auto cnnNetwork = ie.ReadNetwork(modelPath);
 
     if (deviceName.find("CPU") != std::string::npos) {
-#ifdef WITH_EXTENSIONS
-        ie.AddExtension(std::make_shared<InferenceEngine::Extensions::Cpu::CpuExtensions>(), "CPU");
-#endif
         ie.SetConfig({{InferenceEngine::PluginConfigParams::KEY_CPU_BIND_THREAD, "NO"}}, "CPU");
     }
     if (!cpuExtensionPath.empty()) {
@@ -67,26 +57,26 @@ void IEGraph::initNetwork(const std::string& deviceName) {
 
     // Set batch size
     if (batchSize > 1) {
-        auto inShapes = netReader.getNetwork().getInputShapes();
+        auto inShapes = cnnNetwork.getInputShapes();
         for (auto& pair : inShapes) {
             auto& dims = pair.second;
             if (!dims.empty()) {
                 dims[0] = batchSize;
             }
         }
-        netReader.getNetwork().reshape(inShapes);
+        cnnNetwork.reshape(inShapes);
     }
 
     InferenceEngine::ExecutableNetwork network;
-    network = ie.LoadNetwork(netReader.getNetwork(), deviceName);
+    network = ie.LoadNetwork(cnnNetwork, deviceName);
 
-    InferenceEngine::InputsDataMap inputInfo(netReader.getNetwork().getInputsInfo());
+    InferenceEngine::InputsDataMap inputInfo(cnnNetwork.getInputsInfo());
     if (inputInfo.size() != 1) {
         throw std::logic_error("Face Detection network should have only one input");
     }
     inputDataBlobName = inputInfo.begin()->first;
 
-    InferenceEngine::OutputsDataMap outputInfo(netReader.getNetwork().getOutputsInfo());
+    InferenceEngine::OutputsDataMap outputInfo(cnnNetwork.getOutputsInfo());
     outputDataBlobNames.reserve(outputInfo.size());
     for (const auto& i : outputInfo) {
         outputDataBlobNames.push_back(i.first);
@@ -97,6 +87,9 @@ void IEGraph::initNetwork(const std::string& deviceName) {
         availableRequests.push(req);
     }
 
+    if (postLoad != nullptr)
+        postLoad(outputDataBlobNames, cnnNetwork);
+
     availableRequests.front()->StartAsync();
     availableRequests.front()->Wait(InferenceEngine::IInferRequest::WaitMode::RESULT_READY);
 }
@@ -119,9 +112,8 @@ void IEGraph::start(GetterFunc getterFunc, PostprocessingFunc postprocessingFunc
                     vframes.push_back(std::make_shared<VideoFrame>(vframe));
                     ++b;
                 } else {
-                    if (terminate) {
-                        break;
-                    }
+                    terminate = true;
+                    break;
                 }
             }
 
@@ -188,6 +180,7 @@ void IEGraph::start(GetterFunc getterFunc, PostprocessingFunc postprocessingFunc
             }
             condVarBusyRequests.notify_one();
         }
+        condVarBusyRequests.notify_one(); // notify that there will be no new InferRequests
     });
 }
 
@@ -195,15 +188,21 @@ IEGraph::IEGraph(const InitParams& p):
     perfTimerPreprocess(p.collectStats ? PerfTimer::DefaultIterationsCount : 0),
     perfTimerInfer(p.collectStats ? PerfTimer::DefaultIterationsCount : 0),
     confidenceThreshold(0.5f), batchSize(p.batchSize),
-    modelPath(p.modelPath), weightsPath(p.weightsPath),
+    modelPath(p.modelPath),
     cpuExtensionPath(p.cpuExtPath), cldnnConfigPath(p.cldnnConfigPath),
     printPerfReport(p.reportPerf), deviceName(p.deviceName),
     maxRequests(p.maxRequests) {
     assert(p.maxRequests > 0);
 
+    postLoad = p.postLoadFunc;
     initNetwork(p.deviceName);
 }
 
+bool IEGraph::isRunning() {
+    std::lock_guard<std::mutex> lock(mtxBusyRequests);
+    return !terminate || !busyBatchRequests.empty();
+}
+
 InferenceEngine::SizeVector IEGraph::getInputDims() const {
     assert(!availableRequests.empty());
     auto inputBlob = availableRequests.front()->GetBlob(inputDataBlobName);
@@ -217,8 +216,12 @@ std::vector<std::shared_ptr<VideoFrame> > IEGraph::getBatchData(cv::Size frameSi
     {
         std::unique_lock<std::mutex> lock(mtxBusyRequests);
         condVarBusyRequests.wait(lock, [&]() {
-            return !busyBatchRequests.empty();
+            // wait until the pipeline is stopped or there are new InferRequests
+            return terminate || !busyBatchRequests.empty();
         });
+        if (busyBatchRequests.empty()) {
+            return {}; // woke up because of termination, so leave if there is nothing to process
+        }
         vframes = std::move(busyBatchRequests.front().vfPtrVec);
         req = std::move(busyBatchRequests.front().req);
         startTime = std::move(busyBatchRequests.front().startTime);
diff --git a/demos/multichannel_demo/common/graph.hpp b/demos/multi_channel/common/graph.hpp
similarity index 93%
rename from demos/multichannel_demo/common/graph.hpp
rename to demos/multi_channel/common/graph.hpp
index 300c0e650aa..261c9e96785 100644
--- a/demos/multichannel_demo/common/graph.hpp
+++ b/demos/multi_channel/common/graph.hpp
@@ -45,7 +45,6 @@ class IEGraph{
     std::size_t batchSize;
 
     std::string modelPath;
-    std::string weightsPath;
     std::string cpuExtensionPath;
     std::string cldnnConfigPath;
 
@@ -77,6 +76,8 @@ class IEGraph{
     GetterFunc getter;
     using PostprocessingFunc = std::function<std::vector<Detections>(InferenceEngine::InferRequest::Ptr, const std::vector<std::string>&, cv::Size)>;
     PostprocessingFunc postprocessing;
+    using PostLoadFunc = std::function<void (const std::vector<std::string>&, InferenceEngine::CNNNetwork&)>;
+    PostLoadFunc postLoad;
     std::thread getterThread;
 
     void initNetwork(const std::string& deviceName);
@@ -88,16 +89,18 @@ class IEGraph{
         bool collectStats = false;
         bool reportPerf = false;
         std::string modelPath;
-        std::string weightsPath;
         std::string cpuExtPath;
         std::string cldnnConfigPath;
         std::string deviceName;
+        PostLoadFunc postLoadFunc = nullptr;
     };
 
     explicit IEGraph(const InitParams& p);
 
     void start(GetterFunc getterFunc, PostprocessingFunc postprocessingFunc);
 
+    bool isRunning();
+
     InferenceEngine::SizeVector getInputDims() const;
 
     std::vector<std::shared_ptr<VideoFrame>> getBatchData(cv::Size windowSize);
diff --git a/demos/multichannel_demo/common/input.cpp b/demos/multi_channel/common/input.cpp
similarity index 86%
rename from demos/multichannel_demo/common/input.cpp
rename to demos/multi_channel/common/input.cpp
index 14b25e7153d..048139a0a2e 100644
--- a/demos/multichannel_demo/common/input.cpp
+++ b/demos/multi_channel/common/input.cpp
@@ -34,7 +34,7 @@
 
 class VideoSource {
 public:
-    virtual bool init() = 0;
+    virtual bool isRunning() const = 0;
 
     virtual void start() = 0;
 
@@ -142,7 +142,7 @@ class VideoSourceStreamFile : public VideoSource {
 
     VideoStream stream;
 
-    std::atomic_bool terminate = {false};
+    std::atomic_bool running = {false};
     std::atomic_bool is_decoding = {false};
 
     std::mutex mutex;
@@ -170,12 +170,14 @@ class VideoSourceStreamFile : public VideoSource {
         queueSize(queueSize_),
         perfTimer(collectStats_ ? PerfTimer::DefaultIterationsCount : 0) { }
 
-    bool init() { return true; }
+    bool isRunning() const override {
+        return running;
+    }
 
     void start() {
-        terminate = false;
+        running = true;
         workThread = std::thread([&]() {
-            while (!terminate) {
+            while (running) {
                 {
                     cv::Mat frame;
                     {
@@ -203,7 +205,7 @@ class VideoSourceStreamFile : public VideoSource {
 
                     std::unique_lock<std::mutex> lock(mutex);
                     condVar.wait(lock, [&]() {
-                        return !is_decoding && (frameQueue.size() < queueSize || terminate);
+                        return !is_decoding && (frameQueue.size() < queueSize || !running);
                     });
                 }
                 hasFrame.notify_one();
@@ -212,7 +214,7 @@ class VideoSourceStreamFile : public VideoSource {
     }
 
     void stop() {
-        terminate = true;
+        running = false;
         condVar.notify_one();
         if (workThread.joinable()) {
             workThread.join();
@@ -222,13 +224,13 @@ class VideoSourceStreamFile : public VideoSource {
     bool read(VideoFrame& frame)  {
         queue_elem_t elem;
 
-        if (terminate)
+        if (!running)
             return false;
 
         {
             std::unique_lock<std::mutex> lock(mutex);
             hasFrame.wait(lock, [&]() {
-                return !frameQueue.empty() || terminate;
+                return !frameQueue.empty() || !running;
             });
             elem = std::move(frameQueue.front());
             frameQueue.pop();
@@ -236,7 +238,7 @@ class VideoSourceStreamFile : public VideoSource {
         condVar.notify_one();
         frame.frame = std::move(elem.second);
 
-        return elem.first && !terminate;
+        return elem.first && running;
     }
 
     float getAvgReadTime() const {
@@ -249,8 +251,8 @@ class VideoSourceStreamFile : public VideoSource {
 class VideoSourceOCV : public VideoSource {
     PerfTimer perfTimer;
     std::thread workThread;
-    const bool isAsync = false;
-    std::atomic_bool terminate = {false};
+    const bool isAsync;
+    std::atomic_bool running = {true};
     std::string videoName;
 
     std::mutex mutex;
@@ -268,9 +270,6 @@ class VideoSourceOCV : public VideoSource {
     template<bool CollectStats>
     bool readFrame(cv::Mat& frame);
 
-    template<bool CollectStats>
-    bool readFrameImpl(cv::Mat& frame);
-
     template<bool CollectStats>
     void startImpl();
 
@@ -282,7 +281,7 @@ class VideoSourceOCV : public VideoSource {
 
     void start();
 
-    bool init();
+    bool isRunning() const override;
 
     void stop();
 
@@ -331,7 +330,7 @@ class VideoSourceNative : public VideoSource {
 
     void start();
 
-    bool init();
+    bool isRunning() const override;
 
     bool read(VideoFrame& frame);
 
@@ -364,8 +363,7 @@ void VideoSourceNative::start() {
     // nothing
 }
 
-bool VideoSourceNative::init() {
-    // nothing
+bool VideoSourceNative::isRunning() const {  // always true; 'override' belongs only on the in-class declaration
     return true;
 }
 
@@ -440,38 +438,8 @@ bool isNumeric(const std::string& str) {
 }
 }  // namespace
 
-bool VideoSourceOCV::init() {
-    static std::mutex initMutex;  // HACK: opencv camera init is not thread-safe
-    std::unique_lock<std::mutex> lock(initMutex);
-    bool res = false;
-    if (isNumeric(videoName)) {
-#ifdef __linux__
-        res = source.open("/dev/video" + videoName);
-#else
-        res = source.open(std::stoi(videoName));
-#endif
-    } else {
-        res = source.open(videoName);
-    }
-    if (res) {
-        source.set(cv::CAP_PROP_FOURCC, cv::VideoWriter::fourcc('M', 'J', 'P', 'G'));
-    }
-    return res;
-}
-
 template<bool CollectStats>
 bool VideoSourceOCV::readFrame(cv::Mat& frame) {
-    if (!source.isOpened() && !init()) {
-        return false;
-    }
-    if (!readFrameImpl<CollectStats>(frame)) {
-        return init() && readFrameImpl<CollectStats>(frame);
-    }
-    return true;
-}
-
-template<bool CollectStats>
-bool VideoSourceOCV::readFrameImpl(cv::Mat& frame) {
     if (CollectStats) {
         ScopedTimer st(perfTimer);
         return source.read(frame);
@@ -483,38 +451,40 @@ bool VideoSourceOCV::readFrameImpl(cv::Mat& frame) {
 VideoSourceOCV::VideoSourceOCV(bool async, bool collectStats_,
                          const std::string& name, size_t queueSize_,
                          size_t pollingTimeMSec_, bool realFps_):
-    perfTimer(collectStats_ ? PerfTimer::DefaultIterationsCount : 0),
-    isAsync(async), videoName(name),
-    realFps(realFps_),
-    queueSize(queueSize_),
-    pollingTimeMSec(pollingTimeMSec_) {}
+        perfTimer(collectStats_ ? PerfTimer::DefaultIterationsCount : 0),
+        isAsync(async), videoName(name),
+        realFps(realFps_),
+        queueSize(queueSize_),
+        pollingTimeMSec(pollingTimeMSec_) {
+    if (isNumeric(videoName)) {
+        if (!source.open(std::stoi(videoName))) {
+            throw std::runtime_error("Can't open " + videoName + " with cv::VideoCapture::open(int)");
+        }
+    } else {
+        if (!source.open(videoName)) {
+            throw std::runtime_error("Can't open " + videoName + " with cv::VideoCapture::open(std::string)");
+        }
+    }
+    source.set(cv::CAP_PROP_FOURCC, cv::VideoWriter::fourcc('M', 'J', 'P', 'G'));
+}
 
 VideoSourceOCV::~VideoSourceOCV() {
     stop();
 }
 
+bool VideoSourceOCV::isRunning() const {
+    return running;
+}
+
 template<bool CollectStats>
 void VideoSourceOCV::thread_fn(VideoSourceOCV *vs) {
-    while (!vs->terminate) {
+    while (vs->running) {
         cv::Mat frame;
-        bool result = false;
-        while (!((result = vs->readFrame<CollectStats>(frame)) || vs->terminate)) {
-            std::unique_lock<std::mutex> lock(vs->mutex);
-            if (vs->queue.empty() || vs->queue.back().first) {
-                vs->queue.push({false, frame});
-                lock.unlock();
-                vs->hasFrame.notify_one();
-                lock.lock();
-            }
-            std::chrono::milliseconds timeout(vs->pollingTimeMSec);
-            vs->condVar.wait_for(lock,
-                             timeout,
-                             [&]() {
-                                 return vs->terminate.load();
-                             });
+        const bool result = vs->readFrame<CollectStats>(frame);
+        if (!result) {
+            vs->running = false; // stop() also affects running, so override it only when out of frames
         }
-
-        if (vs->queue.size() < vs->queueSize) {
+        if (vs->queue.size() < vs->queueSize || !result) { // queue has space or source ran out of frames
             std::unique_lock<std::mutex> lock(vs->mutex);
             vs->queue.push({result, frame});
         }
@@ -525,7 +495,7 @@ void VideoSourceOCV::thread_fn(VideoSourceOCV *vs) {
 template<bool CollectStats>
 void VideoSourceOCV::startImpl() {
     if (isAsync) {
-        terminate = false;
+        running = true;
         workThread = std::thread(&VideoSourceOCV::thread_fn<CollectStats>, this);
     }
 }
@@ -540,7 +510,7 @@ void VideoSourceOCV::start() {
 
 void VideoSourceOCV::stop() {
     if (isAsync) {
-        terminate = true;
+        running = false;
         condVar.notify_one();
         if (workThread.joinable()) {
             workThread.join();
@@ -550,20 +520,17 @@ void VideoSourceOCV::stop() {
 
 bool VideoSourceOCV::read(cv::Mat& frame) {
     if (isAsync) {
-        size_t count = 0;
-        bool res = false;
+        bool res;
         {
             std::unique_lock<std::mutex> lock(mutex);
             hasFrame.wait(lock, [&]() {
-                return !queue.empty() || terminate;
+                return !queue.empty() || !running;
             });
             res = queue.front().first;
             frame = queue.front().second;
             if (realFps || queue.size() > 1 || queueSize == 1) {
                 queue.pop();
             }
-            count = queue.size();
-            (void)count;
         }
         condVar.notify_one();
         return res;
@@ -608,6 +575,13 @@ VideoSources::~VideoSources() {
     // nothing
 }
 
+bool VideoSources::isRunning() const {
+    // when any of the video sources runs out of frames, it stops IEGraph,
+    // so this isRunning() requires that all inputs are still running
+    return std::all_of(inputs.begin(), inputs.end(),
+        [](const std::unique_ptr<VideoSource>& input){return input->isRunning();});
+}
+
 void VideoSources::openVideo(const std::string& source, bool native) {
 #ifdef USE_NATIVE_CAMERA_API
     if (native) {
@@ -626,10 +600,10 @@ void VideoSources::openVideo(const std::string& source, bool native) {
         std::unique_ptr<VideoSource> newSrc(new VideoSourceNative(*this, controller, dev, camSettings,
                                                                      queueSize, realFps, collectStats));
         inputs.emplace_back(std::move(newSrc));
+    } else {
 #else
-    if (false) {
+    {
 #endif
-    } else {
 #if defined(USE_LIBVA)
         const std::string extension = ".mjpeg";
         std::unique_ptr<VideoSource> newSrc;
@@ -643,11 +617,7 @@ void VideoSources::openVideo(const std::string& source, bool native) {
         std::unique_ptr<VideoSource> newSrc(new VideoSourceOCV(isAsync, collectStats, source,
                                             queueSize, pollingTimeMSec, realFps));
 #endif
-        if (newSrc->init()) {
-            inputs.emplace_back(std::move(newSrc));
-        } else {
-            throw std::runtime_error("Cannot open cv::VideoCapture");
-        }
+        inputs.emplace_back(std::move(newSrc));
     }
 }
 
diff --git a/demos/multichannel_demo/common/input.hpp b/demos/multi_channel/common/input.hpp
similarity index 92%
rename from demos/multichannel_demo/common/input.hpp
rename to demos/multi_channel/common/input.hpp
index 413ee022b26..779cc825e05 100644
--- a/demos/multichannel_demo/common/input.hpp
+++ b/demos/multi_channel/common/input.hpp
@@ -40,7 +40,7 @@ class VideoFrame final {
     Detections detections;
     VideoFrame() = default;
 
-    void operator =(VideoFrame const& vf) = delete;
+    VideoFrame& operator =(VideoFrame const& vf) = delete;
 };
 
 class VideoSource;
@@ -58,8 +58,8 @@ class VideoSources {
     std::mutex decode_mutex;  // hardware decoding enqueue lock
 
     std::vector<std::unique_ptr<VideoSource>> inputs;
-    const bool isAsync = false;
-    const bool collectStats = false;
+    const bool isAsync;
+    const bool collectStats;
 
     bool realFps;
 
@@ -90,6 +90,8 @@ class VideoSources {
 
     void start();
 
+    virtual bool isRunning() const;
+
     bool getFrame(size_t index, VideoFrame& frame);
 
     struct Stats {
diff --git a/demos/multichannel_demo/common/multicam/CMakeLists.txt b/demos/multi_channel/common/multicam/CMakeLists.txt
similarity index 100%
rename from demos/multichannel_demo/common/multicam/CMakeLists.txt
rename to demos/multi_channel/common/multicam/CMakeLists.txt
diff --git a/demos/multichannel_demo/common/multicam/camera.cpp b/demos/multi_channel/common/multicam/camera.cpp
similarity index 100%
rename from demos/multichannel_demo/common/multicam/camera.cpp
rename to demos/multi_channel/common/multicam/camera.cpp
diff --git a/demos/multichannel_demo/common/multicam/camera.hpp b/demos/multi_channel/common/multicam/camera.hpp
similarity index 100%
rename from demos/multichannel_demo/common/multicam/camera.hpp
rename to demos/multi_channel/common/multicam/camera.hpp
diff --git a/demos/multichannel_demo/common/multicam/controller.cpp b/demos/multi_channel/common/multicam/controller.cpp
similarity index 100%
rename from demos/multichannel_demo/common/multicam/controller.cpp
rename to demos/multi_channel/common/multicam/controller.cpp
diff --git a/demos/multichannel_demo/common/multicam/controller.hpp b/demos/multi_channel/common/multicam/controller.hpp
similarity index 100%
rename from demos/multichannel_demo/common/multicam/controller.hpp
rename to demos/multi_channel/common/multicam/controller.hpp
diff --git a/demos/multichannel_demo/common/multicam/utils.cpp b/demos/multi_channel/common/multicam/utils.cpp
similarity index 100%
rename from demos/multichannel_demo/common/multicam/utils.cpp
rename to demos/multi_channel/common/multicam/utils.cpp
diff --git a/demos/multichannel_demo/common/multicam/utils.hpp b/demos/multi_channel/common/multicam/utils.hpp
similarity index 100%
rename from demos/multichannel_demo/common/multicam/utils.hpp
rename to demos/multi_channel/common/multicam/utils.hpp
diff --git a/demos/multi_channel/common/multichannel_params.hpp b/demos/multi_channel/common/multichannel_params.hpp
new file mode 100644
index 00000000000..471e3bff9eb
--- /dev/null
+++ b/demos/multi_channel/common/multichannel_params.hpp
@@ -0,0 +1,51 @@
+// Copyright (C) 2018-2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#pragma once
+
+#include <string>
+#include <vector>
+#include <gflags/gflags.h>
+
+static const char help_message[] = "Print a usage message";
+static const char model_path_message[] = "Required. Path to an .xml file with a trained model.";
+static const char target_device_message[] = "Optional. Specify the target device for a network (the list of available devices is shown below). "
+                                            "Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                            "The demo looks for a suitable plugin for a specified device.";
+static const char performance_counter_message[] = "Optional. Enable per-layer performance report";
+static const char custom_cldnn_message[] = "Required for GPU custom kernels. "
+                                           "Absolute path to an .xml file with the kernels descriptions";
+static const char custom_cpu_library_message[] = "Required for CPU custom layers. "
+                                                 "Absolute path to a shared library with the kernels implementations";
+static const char no_show_processed_video[] = "Optional. Do not show processed video.";
+static const char num_cameras[] = "Optional. Maximum number of processed camera inputs (web cameras)";
+static const char batch_size[] = "Optional. Batch size for processing (the number of frames processed per infer request)";
+static const char num_infer_requests[] = "Optional. Number of infer requests";
+static const char input_queue_size[] = "Optional. Frame queue size for input channels";
+static const char fps_sampling_period[] = "Optional. FPS measurement sampling period between timepoints in msec";
+static const char num_sampling_periods[] = "Optional. Number of sampling periods";
+static const char show_statistics[] = "Optional. Enable statistics report";
+static const char duplication_channel_number[] = "Optional. Enable and specify the number of channels additionally copied from real sources";
+static const char real_input_fps[] = "Optional. Disable input frames caching, for maximum throughput pipeline";
+static const char input_video[] = "Optional. Specify full path to input video files";
+static const char utilization_monitors_message[] = "Optional. List of monitors to show initially.";
+
+DEFINE_bool(h, false, help_message);
+DEFINE_string(m, "", model_path_message);
+DEFINE_string(d, "CPU", target_device_message);
+DEFINE_bool(pc, false, performance_counter_message);
+DEFINE_string(c, "", custom_cldnn_message);
+DEFINE_string(l, "", custom_cpu_library_message);
+DEFINE_bool(no_show, false, no_show_processed_video);
+DEFINE_uint32(nc, 0, num_cameras);
+DEFINE_uint32(bs, 1, batch_size);
+DEFINE_uint32(nireq, 5, num_infer_requests);
+DEFINE_uint32(n_iqs, 5, input_queue_size);
+DEFINE_uint32(fps_sp, 1000, fps_sampling_period);
+DEFINE_uint32(n_sp, 10, num_sampling_periods);
+DEFINE_bool(show_stats, false, show_statistics);
+DEFINE_uint32(duplicate_num, 0, duplication_channel_number);
+DEFINE_bool(real_input_fps, false, real_input_fps);
+DEFINE_string(i, "", input_video);
+DEFINE_string(u, "", utilization_monitors_message);
diff --git a/demos/multichannel_demo/common/output.cpp b/demos/multi_channel/common/output.cpp
similarity index 98%
rename from demos/multichannel_demo/common/output.cpp
rename to demos/multi_channel/common/output.cpp
index 4aec97fdf6e..3e0c1e8da12 100644
--- a/demos/multichannel_demo/common/output.cpp
+++ b/demos/multi_channel/common/output.cpp
@@ -40,7 +40,7 @@ void AsyncOutput::start() {
             condVar.wait(lock, [&]() {
                 return !queue.empty() || terminate;
             });
-            if (terminate) {
+            if (queue.empty()) {
                 break;
             }
 
@@ -62,7 +62,6 @@ void AsyncOutput::start() {
     });
 }
 
-
 bool AsyncOutput::isAlive() const {
     return !terminate;
 }
diff --git a/demos/multichannel_demo/common/output.hpp b/demos/multi_channel/common/output.hpp
similarity index 100%
rename from demos/multichannel_demo/common/output.hpp
rename to demos/multi_channel/common/output.hpp
diff --git a/demos/multichannel_demo/common/perf_timer.cpp b/demos/multi_channel/common/perf_timer.cpp
similarity index 100%
rename from demos/multichannel_demo/common/perf_timer.cpp
rename to demos/multi_channel/common/perf_timer.cpp
diff --git a/demos/multichannel_demo/common/perf_timer.hpp b/demos/multi_channel/common/perf_timer.hpp
similarity index 100%
rename from demos/multichannel_demo/common/perf_timer.hpp
rename to demos/multi_channel/common/perf_timer.hpp
diff --git a/demos/multichannel_demo/common/threading.cpp b/demos/multi_channel/common/threading.cpp
similarity index 100%
rename from demos/multichannel_demo/common/threading.cpp
rename to demos/multi_channel/common/threading.cpp
diff --git a/demos/multichannel_demo/common/threading.hpp b/demos/multi_channel/common/threading.hpp
similarity index 100%
rename from demos/multichannel_demo/common/threading.hpp
rename to demos/multi_channel/common/threading.hpp
diff --git a/demos/multichannel_demo/fd/CMakeLists.txt b/demos/multi_channel/face_detection_demo/CMakeLists.txt
similarity index 90%
rename from demos/multichannel_demo/fd/CMakeLists.txt
rename to demos/multi_channel/face_detection_demo/CMakeLists.txt
index fac14a84a1d..5b497fcf401 100644
--- a/demos/multichannel_demo/fd/CMakeLists.txt
+++ b/demos/multi_channel/face_detection_demo/CMakeLists.txt
@@ -12,7 +12,7 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-set(TARGET_NAME "multi-channel-face-detection-demo")
+set(TARGET_NAME "multi_channel_face_detection_demo")
 
 if( BUILD_DEMO_NAME AND NOT ${BUILD_DEMO_NAME} STREQUAL ${TARGET_NAME} )
     message(STATUS "DEMO ${TARGET_NAME} SKIPPED")
@@ -60,16 +60,8 @@ if(MULTICHANNEL_DEMO_USE_TBB)
     endif()
 endif()
 
-if(TARGET IE::ie_cpu_extension)
-    add_definitions(-DWITH_EXTENSIONS)
-endif()
-
 target_link_libraries(${TARGET_NAME} ${InferenceEngine_LIBRARIES} gflags ${OpenCV_LIBRARIES} common)
 
-if(TARGET IE::ie_cpu_extension)
-    target_link_libraries(${TARGET_NAME} IE::ie_cpu_extension)
-endif()
-
 if(UNIX)
     target_link_libraries( ${TARGET_NAME} pthread)
 endif()
@@ -83,3 +75,5 @@ if(NOT TARGET ie_samples)
 endif()
 
 add_dependencies(ie_samples ${TARGET_NAME})
+
+target_link_libraries(${TARGET_NAME} monitors)
diff --git a/demos/multichannel_demo/fd/README.md b/demos/multi_channel/face_detection_demo/README.md
similarity index 93%
rename from demos/multichannel_demo/fd/README.md
rename to demos/multi_channel/face_detection_demo/README.md
index cb3d6a005b5..85c38892f36 100644
--- a/demos/multichannel_demo/fd/README.md
+++ b/demos/multi_channel/face_detection_demo/README.md
@@ -22,10 +22,10 @@ On the start-up, the application reads command line parameters and loads the spe
 ## Running
 
 Running the application with the `-h` option yields the following usage message:
-```sh
-./multi-channel-face-detection-demo -h
+```
+./multi_channel_face_detection_demo -h
 
-multi-channel-face-detection-demo [OPTION]
+multi_channel_face_detection_demo [OPTION]
 Options:
 
     -h                           Print a usage message
@@ -47,7 +47,7 @@ Options:
     -duplicate_num               Optional. Enable and specify the number of channels additionally copied from real sources
     -real_input_fps              Optional. Disable input frames caching for maximum throughput pipeline
     -i                           Optional. Specify full path to input video files
-
+    -u                           Optional. List of monitors to show initially.
 ```
 
 To run the demo, you can use public or pre-trained models. To download the pre-trained models, use the OpenVINO [Model Downloader](../../../tools/downloader/README.md) or go to [https://download.01.org/opencv/](https://download.01.org/opencv/).
@@ -56,14 +56,12 @@ To run the demo, you can use public or pre-trained models. To download the pre-t
 
 For example, to run the demo with the pre-trained face detection model on FPGA with fallback on CPU, with one single camera, use the following command:
 ```sh
-./multi-channel-face-detection-demo -m face-detection-retail-0004.xml
--l <demos_build_folder>/intel64/Release/lib/libcpu_extension.so -d HETERO:FPGA,CPU -nc 1
+./multi_channel_face_detection_demo -m face-detection-retail-0004.xml -d HETERO:FPGA,CPU -nc 1
 ```
 
 To run the demo using two recorded video files, use the following command:
 ```sh
-./multi-channel-face-detection-demo -m face-detection-retail-0004.xml
--l <demos_build_folder>/intel64/Release/lib/libcpu_extension.so -d HETERO:FPGA,CPU -i /path/to/file1 /path/to/file2
+./multi_channel_face_detection_demo -m face-detection-retail-0004.xml -d HETERO:FPGA,CPU -i /path/to/file1 /path/to/file2
 ```
 Video files will be processed repeatedly.
 
@@ -87,7 +85,7 @@ General parameter for input video source is `-i`. Use it to specify video files
 
 To see all available web cameras, run the `ls /dev/video*` command. You will get output similar to the following:
 
-```sh
+```
 user@user-PC:~ $ ls /dev/video*
 /dev/video0  /dev/video1  /dev/video2
 ```
@@ -102,7 +100,7 @@ Alternatively, you can just set `-nc 3`, which simplifies application usage.
 
 If your cameras are connected to PC with indexes gap (for example, `0,1,3`), use the `-i` parameter.
 
-IP сameras support:
+IP cameras support:
 ```
 -i rtsp://camera_address_1/ rtsp://camera_address_2/
 ```
diff --git a/demos/multichannel_demo/fd/main.cpp b/demos/multi_channel/face_detection_demo/main.cpp
similarity index 92%
rename from demos/multichannel_demo/fd/main.cpp
rename to demos/multi_channel/face_detection_demo/main.cpp
index 7f2ebd8fc4f..2996cfbe4a3 100644
--- a/demos/multichannel_demo/fd/main.cpp
+++ b/demos/multi_channel/face_detection_demo/main.cpp
@@ -27,8 +27,8 @@
 
 #include <opencv2/opencv.hpp>
 
+#include <monitors/presenter.h>
 #include <samples/slog.hpp>
-
 #include <samples/args_helper.hpp>
 
 #include "input.hpp"
@@ -45,11 +45,11 @@ namespace {
 */
 void showUsage() {
     std::cout << std::endl;
-    std::cout << "multichannel_face_detection [OPTION]" << std::endl;
+    std::cout << "multi_channel_face_detection_demo [OPTION]" << std::endl;
     std::cout << "Options:" << std::endl;
     std::cout << std::endl;
     std::cout << "    -h                           " << help_message << std::endl;
-    std::cout << "    -m \"<path>\"                  " << face_detection_model_message<< std::endl;
+    std::cout << "    -m \"<path>\"                  " << model_path_message<< std::endl;
     std::cout << "      -l \"<absolute_path>\"       " << custom_cpu_library_message << std::endl;
     std::cout << "          Or" << std::endl;
     std::cout << "      -c \"<absolute_path>\"       " << custom_cldnn_message << std::endl;
@@ -67,6 +67,7 @@ void showUsage() {
     std::cout << "    -duplicate_num               " << duplication_channel_number << std::endl;
     std::cout << "    -real_input_fps              " << real_input_fps << std::endl;
     std::cout << "    -i                           " << input_video << std::endl;
+    std::cout << "    -u                           " << utilization_monitors_message << std::endl;
 }
 
 bool ParseAndCheckCommandLine(int argc, char *argv[]) {
@@ -109,7 +110,7 @@ struct Face {
     Face(cv::Rect2f r, float c, unsigned char a, unsigned char g): rect(r), confidence(c), age(a), gender(g) {}
 };
 
-void drawDetections(cv::Mat& img, const std::vector<Face> detections) {
+void drawDetections(cv::Mat& img, const std::vector<Face>& detections) {
     for (const Face& f : detections) {
         cv::Rect ri(static_cast<int>(f.rect.x*img.cols), static_cast<int>(f.rect.y*img.rows),
                     static_cast<int>(f.rect.width*img.cols), static_cast<int>(f.rect.height*img.rows));
@@ -151,7 +152,8 @@ DisplayParams prepareDisplayParams(size_t count) {
 void displayNSources(const std::vector<std::shared_ptr<VideoFrame>>& data,
                      float time,
                      const std::string& stats,
-                     DisplayParams params) {
+                     DisplayParams params,
+                     Presenter& presenter) {
     cv::Mat windowImage = cv::Mat::zeros(params.windowSize, CV_8UC3);
     auto loopBody = [&](size_t i) {
         auto& elem = data[i];
@@ -192,6 +194,7 @@ void displayNSources(const std::vector<std::shared_ptr<VideoFrame>>& data,
         loopBody(i);
     }
 #endif
+    presenter.drawGraphs(windowImage);
     drawStats();
 
     char str[256];
@@ -214,7 +217,6 @@ int main(int argc, char* argv[]) {
             return 0;
         }
 
-        std::string weightsPath;
         std::string modelPath = FLAGS_m;
         std::size_t found = modelPath.find_last_of(".");
         if (found > modelPath.size()) {
@@ -222,9 +224,7 @@ int main(int argc, char* argv[]) {
             slog::info << "Expected to be <model_name>.xml" << slog::endl;
             return -1;
         }
-        weightsPath = modelPath.substr(0, found) + ".bin";
         slog::info << "Model   path: " << modelPath << slog::endl;
-        slog::info << "Weights path: " << weightsPath << slog::endl;
 
         IEGraph::InitParams graphParams;
         graphParams.batchSize       = FLAGS_bs;
@@ -232,7 +232,6 @@ int main(int argc, char* argv[]) {
         graphParams.collectStats    = FLAGS_show_stats;
         graphParams.reportPerf      = FLAGS_pc;
         graphParams.modelPath       = modelPath;
-        graphParams.weightsPath     = weightsPath;
         graphParams.cpuExtPath      = FLAGS_l;
         graphParams.cldnnConfigPath = FLAGS_c;
         graphParams.deviceName      = FLAGS_d;
@@ -346,6 +345,9 @@ int main(int argc, char* argv[]) {
         }
         std::cout << std::endl;
 
+        cv::Size graphSize{static_cast<int>(params.windowSize.width / 4), 60};
+        Presenter presenter(FLAGS_u, params.windowSize.height - graphSize.height - 10, graphSize);
+
         const size_t outputQueueSize = 1;
         AsyncOutput output(FLAGS_show_stats, outputQueueSize,
         [&](const std::vector<std::shared_ptr<VideoFrame>>& result) {
@@ -354,9 +356,11 @@ int main(int argc, char* argv[]) {
                 std::unique_lock<std::mutex> lock(statMutex);
                 str = statStream.str();
             }
-            displayNSources(result, averageFps, str, params);
+            displayNSources(result, averageFps, str, params, presenter);
+            int key = cv::waitKey(1);
+            presenter.handleKey(key);
 
-            return (cv::waitKey(1) != 27);
+            return (key != 27);
         });
 
         output.start();
@@ -370,11 +374,16 @@ int main(int argc, char* argv[]) {
 
         size_t perfItersCounter = 0;
 
-        while (true) {
+        while (sources.isRunning() || network->isRunning()) {
             bool readData = true;
             while (readData) {
                 auto br = network->getBatchData(params.frameSize);
+                if (br.empty()) {
+                    break; // IEGraph::getBatchData had nothing to process and returned. That means it was stopped
+                }
                 for (size_t i = 0; i < br.size(); i++) {
+                    // This approach waits for the next input image for sourceIdx. If only a single image is provided,
+                    // results may not be shown, especially if -real_input_fps is enabled.
                     auto val = static_cast<unsigned int>(br[i]->sourceIdx);
                     auto it = find_if(batchRes.begin(), batchRes.end(), [val] (const std::shared_ptr<VideoFrame>& vf) { return vf->sourceIdx == val; } );
                     if (it != batchRes.end()) {
@@ -448,6 +457,8 @@ int main(int argc, char* argv[]) {
         }
 
         network.reset();
+
+        std::cout << presenter.reportMeans() << '\n';
     }
     catch (const std::exception& error) {
         slog::err << error.what() << slog::endl;
diff --git a/demos/multichannel_demo/models.lst b/demos/multi_channel/face_detection_demo/models.lst
similarity index 85%
rename from demos/multichannel_demo/models.lst
rename to demos/multi_channel/face_detection_demo/models.lst
index 205180adf86..b08884eca53 100644
--- a/demos/multichannel_demo/models.lst
+++ b/demos/multi_channel/face_detection_demo/models.lst
@@ -2,4 +2,3 @@
 face-detection-adas-????
 face-detection-adas-binary-????
 face-detection-retail-????
-human-pose-estimation-????
diff --git a/demos/multichannel_demo/fd/multichannel_face_detection_params.hpp b/demos/multi_channel/face_detection_demo/multichannel_face_detection_params.hpp
similarity index 64%
rename from demos/multichannel_demo/fd/multichannel_face_detection_params.hpp
rename to demos/multi_channel/face_detection_demo/multichannel_face_detection_params.hpp
index 9de1ad57da9..b4ef8ee7ec2 100644
--- a/demos/multichannel_demo/fd/multichannel_face_detection_params.hpp
+++ b/demos/multi_channel/face_detection_demo/multichannel_face_detection_params.hpp
@@ -8,9 +8,6 @@
 #include <vector>
 #include <gflags/gflags.h>
 
-/// @brief message for probability threshold argument
 static const char thresh_output_message[] = "Optional. Probability threshold for detections";
 
-/// \brief Flag to output raw scoring results<br>
-/// It is an optional parameter. Ignored for human-pose-estimation
 DEFINE_double(t, 0.5, thresh_output_message);
diff --git a/demos/multichannel_demo/hpe/CMakeLists.txt b/demos/multi_channel/human_pose_estimation_demo/CMakeLists.txt
similarity index 90%
rename from demos/multichannel_demo/hpe/CMakeLists.txt
rename to demos/multi_channel/human_pose_estimation_demo/CMakeLists.txt
index 4789bcd36b1..7fe48237dda 100644
--- a/demos/multichannel_demo/hpe/CMakeLists.txt
+++ b/demos/multi_channel/human_pose_estimation_demo/CMakeLists.txt
@@ -12,7 +12,7 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-set(TARGET_NAME "multi-channel-human-pose-estimation-demo")
+set(TARGET_NAME "multi_channel_human_pose_estimation_demo")
 
 if( BUILD_DEMO_NAME AND NOT ${BUILD_DEMO_NAME} STREQUAL ${TARGET_NAME} )
     message(STATUS "DEMO ${TARGET_NAME} SKIPPED")
@@ -60,13 +60,7 @@ if(MULTICHANNEL_DEMO_USE_TBB)
     endif()
 endif()
 
-if(TARGET IE::ie_cpu_extension)
-    add_definitions(-DWITH_EXTENSIONS)
-endif()
 target_link_libraries(${TARGET_NAME} ${InferenceEngine_LIBRARIES} gflags ${OpenCV_LIBRARIES} common)
-if(TARGET IE::ie_cpu_extension)
-    target_link_libraries(${TARGET_NAME} IE::ie_cpu_extension)
-endif()
 
 if(UNIX)
     target_link_libraries( ${TARGET_NAME} pthread)
@@ -81,3 +75,5 @@ if(COMMAND add_cpplint_target)
 endif()
 
 add_dependencies(ie_samples ${TARGET_NAME})
+
+target_link_libraries(${TARGET_NAME} monitors)
diff --git a/demos/multichannel_demo/hpe/README.md b/demos/multi_channel/human_pose_estimation_demo/README.md
similarity index 92%
rename from demos/multichannel_demo/hpe/README.md
rename to demos/multi_channel/human_pose_estimation_demo/README.md
index bec055f1d54..06922caf992 100644
--- a/demos/multichannel_demo/hpe/README.md
+++ b/demos/multi_channel/human_pose_estimation_demo/README.md
@@ -22,9 +22,9 @@ On the start-up, the application reads command line parameters and loads the spe
 ## Running
 
 Running the application with the `-h` option yields the following usage message:
-```sh
-./multi-channel-human-pose-estimation-demo -h
-multi-channel-human-pose-estimation-demo [OPTION]
+```
+./multi_channel_human_pose_estimation_demo -h
+multi_channel_human_pose_estimation_demo [OPTION]
 Options:
     -h                           Print a usage message
     -m "<path>"                  Required. Path to an .xml file with a trained model.
@@ -44,6 +44,7 @@ Options:
     -duplicate_num               Optional. Enable and specify the number of channels additionally copied from real sources
     -real_input_fps              Optional. Disable input frames caching for maximum throughput pipeline
     -i "<absolute_path>"         Optional. Specify a full path to input video files
+    -u                           Optional. List of monitors to show initially.
 ```
 
 Running the application with an empty list of options yields the usage message given above and an error message.
@@ -54,14 +55,12 @@ To run the demo, you can use public or pre-trained models. To download the pre-t
 
 For example, to run the demo with the pre-trained Human Pose Estimation model on FPGA with fallback on CPU with one camera, use the following command:
 ```sh
-./multi-channel-human-pose-estimation-demo -m <path_to_model>/human-pose-estimation-0001.xml
--l <demos_build_folder>/intel64/Release/lib/libcpu_extension.so -d HETERO:FPGA,CPU -nc 1
+./multi_channel_human_pose_estimation_demo -m <path_to_model>/human-pose-estimation-0001.xml -d HETERO:FPGA,CPU -nc 1
 ```
 
 To run the demo using two recorded video files, use the following command:
 ```sh
-./multi-channel-human-pose-estimation-demo -m <path_to_model>/human-pose-estimation-0001.xml
--l <demos_build_folder>/intel64/Release/lib/libcpu_extension.so -d HETERO:FPGA,CPU -i /path/to/file1 /path/to/file2
+./multi_channel_human_pose_estimation_demo -m <path_to_model>/human-pose-estimation-0001.xml -d HETERO:FPGA,CPU -i /path/to/file1 /path/to/file2
 ```
 
 Video files will be processed repeatedly.
@@ -86,7 +85,7 @@ General parameter for input video source is `-i`. Use it to specify video files
 
 To see all available web cameras, run the `ls /dev/video*` command. You will get output similar to the following:
 
-```sh
+```
 user@user-PC:~ $ ls /dev/video*
 /dev/video0  /dev/video1  /dev/video2
 ```
diff --git a/demos/multichannel_demo/hpe/human_pose.cpp b/demos/multi_channel/human_pose_estimation_demo/human_pose.cpp
similarity index 100%
rename from demos/multichannel_demo/hpe/human_pose.cpp
rename to demos/multi_channel/human_pose_estimation_demo/human_pose.cpp
diff --git a/demos/multichannel_demo/hpe/human_pose.hpp b/demos/multi_channel/human_pose_estimation_demo/human_pose.hpp
similarity index 100%
rename from demos/multichannel_demo/hpe/human_pose.hpp
rename to demos/multi_channel/human_pose_estimation_demo/human_pose.hpp
diff --git a/demos/multichannel_demo/hpe/main.cpp b/demos/multi_channel/human_pose_estimation_demo/main.cpp
similarity index 93%
rename from demos/multichannel_demo/hpe/main.cpp
rename to demos/multi_channel/human_pose_estimation_demo/main.cpp
index a6fd3e5457c..b7ebd07fbd2 100644
--- a/demos/multichannel_demo/hpe/main.cpp
+++ b/demos/multi_channel/human_pose_estimation_demo/main.cpp
@@ -38,8 +38,8 @@
 
 #include <opencv2/opencv.hpp>
 
+#include <monitors/presenter.h>
 #include <samples/slog.hpp>
-
 #include <samples/args_helper.hpp>
 
 #include "input.hpp"
@@ -61,11 +61,11 @@ namespace {
 */
 void showUsage() {
     std::cout << std::endl;
-    std::cout << "multi-channel-human-pose-estimation-demo [OPTION]" << std::endl;
+    std::cout << "multi_channel_human_pose_estimation_demo [OPTION]" << std::endl;
     std::cout << "Options:" << std::endl;
     std::cout << std::endl;
     std::cout << "    -h                           " << help_message << std::endl;
-    std::cout << "    -m \"<path>\"                  " << face_detection_model_message<< std::endl;
+    std::cout << "    -m \"<path>\"                  " << model_path_message<< std::endl;
     std::cout << "      -l \"<absolute_path>\"       " << custom_cpu_library_message << std::endl;
     std::cout << "          Or" << std::endl;
     std::cout << "      -c \"<absolute_path>\"       " << custom_cldnn_message << std::endl;
@@ -82,6 +82,7 @@ void showUsage() {
     std::cout << "    -duplicate_num               " << duplication_channel_number << std::endl;
     std::cout << "    -real_input_fps              " << real_input_fps << std::endl;
     std::cout << "    -i                           " << input_video << std::endl;
+    std::cout << "    -u                           " << utilization_monitors_message << std::endl;
 }
 
 bool ParseAndCheckCommandLine(int argc, char *argv[]) {
@@ -149,7 +150,8 @@ DisplayParams prepareDisplayParams(size_t count) {
 void displayNSources(const std::vector<std::shared_ptr<VideoFrame>>& data,
                      float time,
                      const std::string& stats,
-                     DisplayParams params) {
+                     DisplayParams params,
+                     Presenter& presenter) {
     cv::Mat windowImage = cv::Mat::zeros(params.windowSize, CV_8UC3);
     auto loopBody = [&](size_t i) {
         auto& elem = data[i];
@@ -190,6 +192,7 @@ void displayNSources(const std::vector<std::shared_ptr<VideoFrame>>& data,
         loopBody(i);
     }
 #endif
+    presenter.drawGraphs(windowImage);
     drawStats();
 
     char str[256];
@@ -212,7 +215,6 @@ int main(int argc, char* argv[]) {
             return 0;
         }
 
-        std::string weightsPath;
         std::string modelPath = FLAGS_m;
         std::size_t found = modelPath.find_last_of(".");
         if (found > modelPath.size()) {
@@ -220,9 +222,7 @@ int main(int argc, char* argv[]) {
             slog::info << "Expected to be <model_name>.xml" << slog::endl;
             return -1;
         }
-        weightsPath = modelPath.substr(0, found) + ".bin";
         slog::info << "Model   path: " << modelPath << slog::endl;
-        slog::info << "Weights path: " << weightsPath << slog::endl;
 
         IEGraph::InitParams graphParams;
         graphParams.batchSize       = FLAGS_bs;
@@ -230,7 +230,6 @@ int main(int argc, char* argv[]) {
         graphParams.collectStats    = FLAGS_show_stats;
         graphParams.reportPerf      = FLAGS_pc;
         graphParams.modelPath       = modelPath;
-        graphParams.weightsPath     = weightsPath;
         graphParams.cpuExtPath      = FLAGS_l;
         graphParams.cldnnConfigPath = FLAGS_c;
         graphParams.deviceName      = FLAGS_d;
@@ -344,6 +343,9 @@ int main(int argc, char* argv[]) {
         }
         std::cout << std::endl;
 
+        cv::Size graphSize{static_cast<int>(params.windowSize.width / 4), 60};
+        Presenter presenter(FLAGS_u, params.windowSize.height - graphSize.height - 10, graphSize);
+
         const size_t outputQueueSize = 1;
         AsyncOutput output(FLAGS_show_stats, outputQueueSize,
         [&](const std::vector<std::shared_ptr<VideoFrame>>& result) {
@@ -352,9 +354,11 @@ int main(int argc, char* argv[]) {
                 std::unique_lock<std::mutex> lock(statMutex);
                 str = statStream.str();
             }
-            displayNSources(result, averageFps, str, params);
+            displayNSources(result, averageFps, str, params, presenter);
+            int key = cv::waitKey(1);
+            presenter.handleKey(key);
 
-            return (cv::waitKey(1) != 27);
+            return (key != 27);
         });
 
         output.start();
@@ -368,11 +372,16 @@ int main(int argc, char* argv[]) {
 
         size_t perfItersCounter = 0;
 
-        while (true) {
+        while (sources.isRunning() || network->isRunning()) {
             bool readData = true;
             while (readData) {
                 auto br = network->getBatchData(params.frameSize);
+                if (br.empty()) {
+                    break; // IEGraph::getBatchData had nothing to process and returned. That means it was stopped
+                }
                 for (size_t i = 0; i < br.size(); i++) {
+                    // This approach waits for the next input image for sourceIdx. If only a single image is provided,
+                    // results may not be shown, especially if -real_input_fps is enabled.
                     auto val = static_cast<unsigned int>(br[i]->sourceIdx);
                     auto it = find_if(batchRes.begin(), batchRes.end(), [val] (const std::shared_ptr<VideoFrame>& vf) { return vf->sourceIdx == val; } );
                     if (it != batchRes.end()) {
@@ -446,6 +455,8 @@ int main(int argc, char* argv[]) {
         }
 
         network.reset();
+
+        std::cout << presenter.reportMeans() << '\n';
     }
     catch (const std::exception& error) {
         slog::err << error.what() << slog::endl;
diff --git a/demos/multi_channel/human_pose_estimation_demo/models.lst b/demos/multi_channel/human_pose_estimation_demo/models.lst
new file mode 100644
index 00000000000..26d650bc499
--- /dev/null
+++ b/demos/multi_channel/human_pose_estimation_demo/models.lst
@@ -0,0 +1,2 @@
+# This file can be used with the --list option of the model downloader.
+human-pose-estimation-????
diff --git a/demos/multichannel_demo/hpe/peak.cpp b/demos/multi_channel/human_pose_estimation_demo/peak.cpp
similarity index 98%
rename from demos/multichannel_demo/hpe/peak.cpp
rename to demos/multi_channel/human_pose_estimation_demo/peak.cpp
index 4ffdc7a7594..51b423c1c2b 100644
--- a/demos/multichannel_demo/hpe/peak.cpp
+++ b/demos/multi_channel/human_pose_estimation_demo/peak.cpp
@@ -18,6 +18,8 @@
 #include <utility>
 #include <vector>
 
+#include <samples/common.hpp>
+
 #include "peak.hpp"
 
 Peak::Peak(const int id, const cv::Point2f& pos, const float score)
@@ -123,11 +125,11 @@ std::vector<HumanPose> groupPeaksToPoses(const std::vector<std::vector<Peak> >&
                                          const float foundMidPointsRatioThreshold,
                                          const int minJointsNumber,
                                          const float minSubsetScore) {
-    const std::vector<std::pair<int, int> > limbIdsHeatmap = {
+    static const std::pair<int, int> limbIdsHeatmap[] = {
         {2, 3}, {2, 6}, {3, 4}, {4, 5}, {6, 7}, {7, 8}, {2, 9}, {9, 10}, {10, 11}, {2, 12}, {12, 13}, {13, 14},
         {2, 1}, {1, 15}, {15, 17}, {1, 16}, {16, 18}, {3, 17}, {6, 18}
     };
-    const std::vector<std::pair<int, int> > limbIdsPaf = {
+    static const std::pair<int, int> limbIdsPaf[] = {
         {31, 32}, {39, 40}, {33, 34}, {35, 36}, {41, 42}, {43, 44}, {19, 20}, {21, 22}, {23, 24}, {25, 26},
         {27, 28}, {29, 30}, {47, 48}, {49, 50}, {53, 54}, {51, 52}, {55, 56}, {37, 38}, {45, 46}
     };
@@ -137,7 +139,7 @@ std::vector<HumanPose> groupPeaksToPoses(const std::vector<std::vector<Peak> >&
          candidates.insert(candidates.end(), peaks.begin(), peaks.end());
     }
     std::vector<HumanPoseByPeaksIndices> subset(0, HumanPoseByPeaksIndices(keypointsNumber));
-    for (size_t k = 0; k < limbIdsPaf.size(); k++) {
+    for (size_t k = 0; k < arraySize(limbIdsPaf); k++) {
         std::vector<TwoJointsConnection> connections;
         const int mapIdxOffset = keypointsNumber + 1;
         std::pair<cv::Mat, cv::Mat> scoreMid = { pafs[limbIdsPaf[k].first - mapIdxOffset],
diff --git a/demos/multichannel_demo/hpe/peak.hpp b/demos/multi_channel/human_pose_estimation_demo/peak.hpp
similarity index 100%
rename from demos/multichannel_demo/hpe/peak.hpp
rename to demos/multi_channel/human_pose_estimation_demo/peak.hpp
diff --git a/demos/multichannel_demo/hpe/postprocess.cpp b/demos/multi_channel/human_pose_estimation_demo/postprocess.cpp
similarity index 100%
rename from demos/multichannel_demo/hpe/postprocess.cpp
rename to demos/multi_channel/human_pose_estimation_demo/postprocess.cpp
diff --git a/demos/multichannel_demo/hpe/postprocess.hpp b/demos/multi_channel/human_pose_estimation_demo/postprocess.hpp
similarity index 100%
rename from demos/multichannel_demo/hpe/postprocess.hpp
rename to demos/multi_channel/human_pose_estimation_demo/postprocess.hpp
diff --git a/demos/multichannel_demo/hpe/postprocessor.cpp b/demos/multi_channel/human_pose_estimation_demo/postprocessor.cpp
similarity index 100%
rename from demos/multichannel_demo/hpe/postprocessor.cpp
rename to demos/multi_channel/human_pose_estimation_demo/postprocessor.cpp
diff --git a/demos/multichannel_demo/hpe/postprocessor.hpp b/demos/multi_channel/human_pose_estimation_demo/postprocessor.hpp
similarity index 100%
rename from demos/multichannel_demo/hpe/postprocessor.hpp
rename to demos/multi_channel/human_pose_estimation_demo/postprocessor.hpp
diff --git a/demos/multichannel_demo/hpe/render_human_pose.cpp b/demos/multi_channel/human_pose_estimation_demo/render_human_pose.cpp
similarity index 95%
rename from demos/multichannel_demo/hpe/render_human_pose.cpp
rename to demos/multi_channel/human_pose_estimation_demo/render_human_pose.cpp
index 4ddf4744da0..4ecf53ca5d3 100644
--- a/demos/multichannel_demo/hpe/render_human_pose.cpp
+++ b/demos/multi_channel/human_pose_estimation_demo/render_human_pose.cpp
@@ -19,12 +19,13 @@
 
 #include <opencv2/imgproc/imgproc.hpp>
 
+#include "postprocess.hpp"
 #include "render_human_pose.hpp"
 
 void renderHumanPose(const std::vector<HumanPose>& poses, cv::Mat& image) {
     CV_Assert(image.type() == CV_8UC3);
 
-    const std::vector<cv::Scalar> colors = {
+    static const cv::Scalar colors[keypointsNumber] = {
         cv::Scalar(255, 0, 0), cv::Scalar(255, 85, 0), cv::Scalar(255, 170, 0),
         cv::Scalar(255, 255, 0), cv::Scalar(170, 255, 0), cv::Scalar(85, 255, 0),
         cv::Scalar(0, 255, 0), cv::Scalar(0, 255, 85), cv::Scalar(0, 255, 170),
@@ -32,7 +33,7 @@ void renderHumanPose(const std::vector<HumanPose>& poses, cv::Mat& image) {
         cv::Scalar(0, 0, 255), cv::Scalar(85, 0, 255), cv::Scalar(170, 0, 255),
         cv::Scalar(255, 0, 255), cv::Scalar(255, 0, 170), cv::Scalar(255, 0, 85)
     };
-    const std::vector<std::pair<int, int> > limbKeypointsIds = {
+    static const std::pair<int, int> limbKeypointsIds[] = {
         {1, 2},  {1, 5},   {2, 3},
         {3, 4},  {5, 6},   {6, 7},
         {1, 8},  {8, 9},   {9, 10},
diff --git a/demos/multichannel_demo/hpe/render_human_pose.hpp b/demos/multi_channel/human_pose_estimation_demo/render_human_pose.hpp
similarity index 100%
rename from demos/multichannel_demo/hpe/render_human_pose.hpp
rename to demos/multi_channel/human_pose_estimation_demo/render_human_pose.hpp
diff --git a/demos/multi_channel/object_detection_demo_yolov3/CMakeLists.txt b/demos/multi_channel/object_detection_demo_yolov3/CMakeLists.txt
new file mode 100644
index 00000000000..1490e4242c7
--- /dev/null
+++ b/demos/multi_channel/object_detection_demo_yolov3/CMakeLists.txt
@@ -0,0 +1,79 @@
+# Copyright (C) 2018-2019 Intel Corporation
+
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+
+#      http://www.apache.org/licenses/LICENSE-2.0
+
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+set(TARGET_NAME "multi_channel_object_detection_demo_yolov3")
+
+if( BUILD_DEMO_NAME AND NOT ${BUILD_DEMO_NAME} STREQUAL ${TARGET_NAME} )
+    message(STATUS "DEMO ${TARGET_NAME} SKIPPED")
+    return()
+endif()
+
+# Find OpenCV components if exist
+find_package(OpenCV COMPONENTS highgui QUIET)
+if(NOT(OpenCV_FOUND))
+    message(WARNING "OPENCV is disabled or not found, " ${TARGET_NAME} " skipped")
+    return()
+endif()
+
+file (GLOB MAIN_SRC
+        ${CMAKE_CURRENT_SOURCE_DIR}/*.cpp
+        )
+
+file (GLOB MAIN_HEADERS
+        ${CMAKE_CURRENT_SOURCE_DIR}/*.hpp
+        )
+
+# Create named folders for the sources within the .vcproj
+# Empty name lists them directly under the .vcproj
+source_group("src" FILES ${MAIN_SRC})
+source_group("include" FILES ${MAIN_HEADERS})
+
+# Create the demo executable from the sources.
+add_executable(${TARGET_NAME} ${MAIN_SRC} ${MAIN_HEADERS})
+
+set_target_properties(${TARGET_NAME} PROPERTIES
+    POSITION_INDEPENDENT_CODE ON
+    COMPILE_PDB_NAME ${TARGET_NAME})
+
+if(MULTICHANNEL_DEMO_USE_TBB)
+    find_package(TBB REQUIRED tbb)
+    target_link_libraries(${TARGET_NAME} ${TBB_IMPORTED_TARGETS})
+    target_compile_definitions(${TARGET_NAME} PRIVATE
+        USE_TBB=1
+        __TBB_ALLOW_MUTABLE_FUNCTORS=1)
+
+    if(FALSE) # disable task isolation for now due to bugs in tbb
+        target_compile_definitions(${TARGET_NAME} PRIVATE
+            TBB_PREVIEW_TASK_ISOLATION=1
+            TBB_TASK_ISOLATION=1)
+    endif()
+endif()
+
+target_link_libraries(${TARGET_NAME} ${InferenceEngine_LIBRARIES} gflags ${OpenCV_LIBRARIES} common)
+
+if(UNIX)
+    target_link_libraries( ${TARGET_NAME} pthread)
+endif()
+
+if(COMMAND add_cpplint_target)
+    add_cpplint_target(${TARGET_NAME}_cpplint FOR_TARGETS ${TARGET_NAME})
+endif()
+
+if(NOT TARGET ie_samples)
+    add_custom_target(ie_samples ALL)
+endif()
+
+add_dependencies(ie_samples ${TARGET_NAME})
+
+target_link_libraries(${TARGET_NAME} monitors)
diff --git a/demos/multi_channel/object_detection_demo_yolov3/README.md b/demos/multi_channel/object_detection_demo_yolov3/README.md
new file mode 100644
index 00000000000..636d5049e70
--- /dev/null
+++ b/demos/multi_channel/object_detection_demo_yolov3/README.md
@@ -0,0 +1,114 @@
+# Multi-Channel Object Detection Yolov3 C++ Demo
+
+This demo provides an inference pipeline for multi-channel YOLO v3 object detection. The demo uses the YOLO v3 Object Detection network. Follow [this](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_convert_model_tf_specific_Convert_YOLO_From_Tensorflow.html) page to convert the YOLO v3 and tiny YOLO v3 models into the IR format, and then run this demo with the converted IR model.
+
+> **NOTES**:
+> If you don't use [this](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_convert_model_tf_specific_Convert_YOLO_From_Tensorflow.html) page to convert the model, it may not work. 
+
+Other demo objectives are:
+
+* Up to 16 cameras as inputs, via OpenCV*
+* Visualization of detected objects from all channels on a single screen
+
+
+## How It Works
+
+On the start-up, the application reads command line parameters and loads the specified networks. The Yolo v3 Object Detection network is required.
+
+> **NOTES**:
+> * By default, Open Model Zoo demos expect input with BGR channels order. If you trained your model to work with RGB order, you need to manually rearrange the default channels order in the demo application or reconvert your model using the Model Optimizer tool with `--reverse_input_channels` argument specified. For more information about the argument, refer to **When to Reverse Input Channels** section of [Converting a Model Using General Conversion Parameters](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_convert_model_Converting_Model_General.html).
+
+## Running
+
+Running the application with the `-h` option yields the following usage message:
+```
+cd <samples_build_folder>/intel64/Release
+./multi_channel_object_detection_demo_yolov3 -h
+
+multi_channel_object_detection_demo_yolov3 [OPTION]
+Options:
+
+    -h                           Print a usage message.
+    -m "<path>"                  Required. Path to an .xml file with a trained yolo v3 or tiny yolo v3 model.
+      -l "<absolute_path>"       Required for MKLDNN (CPU)-targeted custom layers. Absolute path to a shared library with the kernels impl.
+          Or
+      -c "<absolute_path>"       Required for clDNN (GPU)-targeted custom kernels. Absolute path to the xml file with the kernels desc.
+    -d "<device>"                Optional. Specify the target device for Face Detection (CPU, GPU, FPGA, HDDL or MYRIAD). The demo will look for a suitable plugin for a specified device.
+    -nc                          Optional. Maximum number of processed camera inputs (web cams)
+    -bs                          Optional. Batch size for processing (the number of frames processed per infer request)
+    -nireq                       Optional. Number of infer requests
+    -n_iqs                       Optional. Frame queue size for input channels
+    -fps_sp                      Optional. FPS measurement sampling period. Duration between timepoints, msec
+    -n_sp                        Optional. Number of sampling periods
+    -pc                          Optional. Enables per-layer performance report.
+    -t                           Optional. Probability threshold for detections.
+    -no_show                     Optional. No show processed video.
+    -show_stats                  Optional. Enable statistics report
+    -duplicate_num               Optional. Enable and specify number of channel additionally copied from real sources
+    -real_input_fps              Optional. Disable input frames caching, for maximum throughput pipeline
+    -i                           Optional. Specify full path to input video files
+    -u                           Optional. List of monitors to show initially.
+```
+
+To run the demo, you can use a public pre-trained model and follow [this](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_convert_model_tf_specific_Convert_YOLO_From_Tensorflow.html) page for instructions on how to convert it to an IR model.
+
+> **NOTE**: Before running the demo with a trained model, make sure the model is converted to the Inference Engine format (\*.xml + \*.bin) using the [Model Optimizer tool](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html).
+
+For example, to run the demo on FPGA with fallback on CPU, with one single camera, use the following command:
+```sh
+./multi_channel_object_detection_demo_yolov3 -m $PATH_OF_YOLO_V3_MODEL -d HETERO:FPGA,CPU -nc 1
+```
+
+To run the demo using two recorded video files, use the following command:
+```sh
+./multi_channel_object_detection_demo_yolov3 -m $PATH_OF_YOLO_V3_MODEL -d HDDL -i /path/to/file1 /path/to/file2
+```
+Video files will be processed repeatedly.
+
+To achieve 100% utilization of one Myriad X, the rule of thumb is to run 4 infer requests on each Myriad X. Option `-nireq 32` can be added to the above command to use 100% of an HDDL-R card. The 32 here is 8 (Myriad X devices on an HDDL-R card) x 4 (infer requests), as in the following command:
+
+```sh
+./multi_channel_object_detection_demo_yolov3 -m $PATH_OF_YOLO_V3_MODEL -d HDDL 
+-i /path/to/file1 /path/to/file2 /path/to/file3 /path/to/file4 -nireq 32
+```
+
+You can also run the demo on web cameras and video files simultaneously by specifying both parameters: `-nc <number of cams> -i <video files sequentially, separated by space>`.
+To run the demo with a single input source (a web camera or a video file), but several channels, specify an additional parameter: `-duplicate_num 3`. You will see four channels: one real and three duplicated. With several input sources, the `-duplicate_num` parameter will duplicate each of them.
+
+## Demo Output
+
+The demo uses OpenCV to display the resulting frames with detections rendered as bounding boxes.
+On the top of the screen, the demo reports throughput in frames per second. You can also enable more detailed statistics in the output using the `-show_stats` option while running the demos.
+
+
+## Input Video Sources
+
+General parameter for input video source is `-i`. Use it to specify video files and web cameras (**USB cameras**) as input video source. You can add the parameter to a sample command line as follows:
+```
+-i <file1> <file2>
+```
+
+`-nc <nc_value>` parameter simplifies usage of multiple web cameras. It connects web cameras with indexes from `0` to `nc_value-1`.
+
+To see all available web cameras, run the `ls /dev/video*` command. You will get output similar to the following:
+
+```
+user@user-PC:~ $ ls /dev/video*
+/dev/video0  /dev/video1  /dev/video2
+```
+
+You can use `-i` option to connect all the three web cameras:
+
+```
+-i /dev/video0  /dev/video1  /dev/video2
+```
+
+Alternatively, you can just set `-nc 3`, which simplifies application usage.
+
+If your cameras are connected to PC with indexes gap (for example, `0,1,3`), use the `-i` parameter.
+
+IP cameras accessed through an RTSP URI are not supported.
+
+## See Also
+* [Using Open Model Zoo demos](../../README.md)
+* [Model Optimizer](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html)
diff --git a/demos/multi_channel/object_detection_demo_yolov3/main.cpp b/demos/multi_channel/object_detection_demo_yolov3/main.cpp
new file mode 100644
index 00000000000..12147d6fdd3
--- /dev/null
+++ b/demos/multi_channel/object_detection_demo_yolov3/main.cpp
@@ -0,0 +1,615 @@
+// Copyright (C) 2018-2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+/**
+* \brief The entry point for the Inference Engine multi_channel_object_detection_demo_yolov3 demo application
+* \file object_detection_demo_yolov3/main.cpp
+* \example object_detection_demo_yolov3/main.cpp
+*/
+#include <iostream>
+#include <vector>
+#include <utility>
+
+#include <algorithm>
+#include <mutex>
+#include <condition_variable>
+#include <thread>
+#include <atomic>
+#include <queue>
+#include <chrono>
+#include <sstream>
+#include <memory>
+#include <string>
+
+#ifdef USE_TBB
+#include <tbb/parallel_for.h>
+#endif
+
+#include <opencv2/opencv.hpp>
+
+#include <monitors/presenter.h>
+#include <samples/slog.hpp>
+#include <samples/args_helper.hpp>
+
+#include "input.hpp"
+#include "multichannel_params.hpp"
+#include "multichannel_object_detection_demo_yolov3_params.hpp"
+#include "output.hpp"
+#include "threading.hpp"
+#include "graph.hpp"
+
+namespace {
+
+/**
+* \brief Prints the demo's usage message (program name, then one line per command-line option) to std::cout
+*/
+void showUsage() {
+    std::cout << std::endl;
+    std::cout << "multi_channel_object_detection_demo_yolov3 [OPTION]" << std::endl;  // must match the executable (CMake target) name
+    std::cout << "Options:" << std::endl;
+    std::cout << std::endl;
+    std::cout << "    -h                           " << help_message << std::endl;
+    std::cout << "    -m \"<path>\"                  " << model_path_message<< std::endl;
+    std::cout << "      -l \"<absolute_path>\"       " << custom_cpu_library_message << std::endl;
+    std::cout << "          Or" << std::endl;
+    std::cout << "      -c \"<absolute_path>\"       " << custom_cldnn_message << std::endl;
+    std::cout << "    -d \"<device>\"                " << target_device_message << std::endl;
+    std::cout << "    -nc                          " << num_cameras << std::endl;
+    std::cout << "    -bs                          " << batch_size << std::endl;
+    std::cout << "    -nireq                       " << num_infer_requests << std::endl;
+    std::cout << "    -n_iqs                       " << input_queue_size << std::endl;
+    std::cout << "    -fps_sp                      " << fps_sampling_period << std::endl;
+    std::cout << "    -n_sp                        " << num_sampling_periods << std::endl;
+    std::cout << "    -pc                          " << performance_counter_message << std::endl;
+    std::cout << "    -t                           " << thresh_output_message << std::endl;
+    std::cout << "    -no_show                     " << no_show_processed_video << std::endl;
+    std::cout << "    -show_stats                  " << show_statistics << std::endl;
+    std::cout << "    -duplicate_num               " << duplication_channel_number << std::endl;
+    std::cout << "    -real_input_fps              " << real_input_fps << std::endl;
+    std::cout << "    -i                           " << input_video << std::endl;
+    std::cout << "    -u                           " << utilization_monitors_message << std::endl;
+}
+
+bool ParseAndCheckCommandLine(int argc, char *argv[]) {
+    // Parses the gflags options, validates them and logs the configuration; returns false when only help (-h) was requested.
+    gflags::ParseCommandLineNonHelpFlags(&argc, &argv, true);  // true: recognized flags are removed from argv
+    if (FLAGS_h) {
+        showUsage();
+        showAvailableDevices();
+        return false;
+    }
+    slog::info << "Parsing input parameters" << slog::endl;
+    // -m is mandatory and at least one source (web cam via -nc or file via -i) is required; otherwise std::logic_error is thrown.
+    if (FLAGS_m.empty()) {
+        throw std::logic_error("Parameter -m is not set");
+    }
+    if (FLAGS_nc == 0 && FLAGS_i.empty()) {
+        throw std::logic_error("Please specify at least one video source(web cam or video file)");
+    }
+    slog::info << "\tDetection model:           " << FLAGS_m << slog::endl;
+    slog::info << "\tDetection threshold:       " << FLAGS_t << slog::endl;
+    slog::info << "\tUtilizing device:          " << FLAGS_d << slog::endl;
+    if (!FLAGS_l.empty()) {  // optional paths are logged only when given
+        slog::info << "\tCPU extension library:     " << FLAGS_l << slog::endl;
+    }
+    if (!FLAGS_c.empty()) {
+        slog::info << "\tCLDNN custom kernels map:  " << FLAGS_c << slog::endl;
+    }
+    slog::info << "\tBatch size:                " << FLAGS_bs << slog::endl;
+    slog::info << "\tNumber of infer requests:  " << FLAGS_nireq << slog::endl;
+    slog::info << "\tNumber of input web cams:  "  << FLAGS_nc << slog::endl;
+
+    return true;
+}
+
+static int EntryIndex(int side, int lcoords, int lclasses, int location, int entry) {  // flat index of one value in the output blob
+    int n = location / (side * side);  // which group of side*side cells (callers pass n * side * side + i)
+    int loc = location % (side * side);  // cell offset inside that group
+    return n * side * side * (lcoords + lclasses + 1) + entry * side * side + loc;  // a group spans (lcoords + lclasses + 1) planes of side*side values
+}
+
+struct YoloParams {  // per-output-layer settings, filled in by GetYoloParams()
+    int num;  // number of anchor pairs selected by the layer's mask
+    int classes;  // value of the layer's "classes" parameter
+    int coords;  // value of the layer's "coords" parameter
+
+    std::vector<float> anchors;  // selected anchors as consecutive pairs: [2n] scales box width, [2n + 1] scales box height
+};
+
+struct DetectionObject {  // one detected box (integer corner coordinates) with its class id and score
+    int xmin, ymin, xmax, ymax, class_id;
+    float confidence;
+    // (x, y) is the box centre; note that h comes before w. x extents are multiplied by w_scale, y extents by h_scale.
+    DetectionObject(double x, double y, double h, double w, int class_id, float confidence, float h_scale, float w_scale) :
+        xmin{static_cast<int>((x - w / 2) * w_scale)},
+        ymin{static_cast<int>((y - h / 2) * h_scale)},
+        xmax{static_cast<int>(this->xmin + w * w_scale)},  // relies on xmin being declared (hence initialized) before xmax
+        ymax{static_cast<int>(this->ymin + h * h_scale)},  // likewise for ymin / ymax
+        class_id{class_id},
+        confidence{confidence} {}
+
+    bool operator <(const DetectionObject &s2) const {  // ordering considers confidence only
+        return this->confidence < s2.confidence;
+    }
+    bool operator >(const DetectionObject &s2) const {  // ordering considers confidence only
+        return this->confidence > s2.confidence;
+    }
+};
+
+double IntersectionOverUnion(const DetectionObject &box_1, const DetectionObject &box_2) {
+    // Returns intersection area / union area of the two boxes, or 0 when the union area is not positive.
+    double width_of_overlap_area = fmin(box_1.xmax, box_2.xmax) - fmax(box_1.xmin, box_2.xmin);
+    double height_of_overlap_area = fmin(box_1.ymax, box_2.ymax) - fmax(box_1.ymin, box_2.ymin);
+    // A negative extent on either axis means the boxes do not overlap at all.
+    double area_of_overlap = (width_of_overlap_area < 0 || height_of_overlap_area < 0)
+        ? 0 : width_of_overlap_area * height_of_overlap_area;
+    double box_1_area = (box_1.ymax - box_1.ymin)  * (box_1.xmax - box_1.xmin);
+    double box_2_area = (box_2.ymax - box_2.ymin)  * (box_2.xmax - box_2.xmin);
+    double area_of_union = box_1_area + box_2_area - area_of_overlap;
+    // Two zero-area boxes give an empty union; report "no overlap" instead of computing 0 / 0 (NaN).
+    return area_of_union > 0 ? area_of_overlap / area_of_union : 0;
+}
+
+void ParseYOLOV3Output(InferenceEngine::InferRequest::Ptr req,
+                       const std::string &outputName,
+                       const YoloParams &yoloParams, const unsigned long resized_im_h,
+                       const unsigned long resized_im_w, const unsigned long original_im_h,
+                       const unsigned long original_im_w,
+                       const double threshold, std::vector<DetectionObject> &objects) {
+    InferenceEngine::Blob::Ptr blob = req->GetBlob(outputName);
+    // Appends to `objects` every box of output `outputName` whose scores reach `threshold`; throws if the output is not square.
+    const int out_blob_h = static_cast<int>(blob->getTensorDesc().getDims()[2]);
+    const int out_blob_w = static_cast<int>(blob->getTensorDesc().getDims()[3]);
+    if (out_blob_h != out_blob_w)
+        throw std::runtime_error("Invalid size of output. It should be in NCHW layout and H should be equal to W. Current H = " + std::to_string(out_blob_h) +
+        ", current W = " + std::to_string(out_blob_w));
+
+    auto num = yoloParams.num;
+    auto coords = yoloParams.coords;
+    auto classes = yoloParams.classes;
+    // Bind by reference: the anchors are only read, so copying the vector on every call is unnecessary.
+    const auto &anchors = yoloParams.anchors;
+
+    auto side = out_blob_h;
+    auto side_square = side * side;
+    const float *output_blob = blob->buffer().as<InferenceEngine::PrecisionTrait<InferenceEngine::Precision::FP32>::value_type *>();
+    // --------------------------- Parsing YOLO Region output -------------------------------------
+    for (int i = 0; i < side_square; ++i) {
+        int row = i / side;
+        int col = i % side;
+        for (int n = 0; n < num; ++n) {
+            int obj_index = EntryIndex(side, coords, classes, n * side_square + i, coords);
+            int box_index = EntryIndex(side, coords, classes, n * side_square + i, 0);
+            float scale = output_blob[obj_index];  // score stored at entry `coords`; multiplied into each class probability below
+            if (scale < threshold)
+                continue;
+            double x = (col + output_blob[box_index + 0 * side_square]) / side * resized_im_w;
+            double y = (row + output_blob[box_index + 1 * side_square]) / side * resized_im_h;
+            double height = std::exp(output_blob[box_index + 3 * side_square]) * anchors[2 * n + 1];
+            double width = std::exp(output_blob[box_index + 2 * side_square]) * anchors[2 * n];
+            for (int j = 0; j < classes; ++j) {
+                int class_index = EntryIndex(side, coords, classes, n * side_square + i, coords + 1 + j);
+                float prob = scale * output_blob[class_index];
+                if (prob < threshold)
+                    continue;
+                DetectionObject obj(x, y, height, width, j, prob,  // note: the constructor takes height before width
+                        static_cast<float>(original_im_h) / static_cast<float>(resized_im_h),
+                        static_cast<float>(original_im_w) / static_cast<float>(resized_im_w));
+                objects.push_back(obj);
+            }
+        }
+    }
+}
+
+void drawDetections(cv::Mat& img, const std::vector<DetectionObject>& detections, const std::vector<cv::Scalar>& colors) {  // draws each detection as a rectangle on img
+    for (const DetectionObject& f : detections) {
+        cv::rectangle(img,
+                      cv::Rect2f(static_cast<float>(f.xmin),
+                                 static_cast<float>(f.ymin),
+                                 static_cast<float>((f.xmax-f.xmin)),  // rectangle width
+                                 static_cast<float>((f.ymax-f.ymin))),  // rectangle height
+                      colors[static_cast<int>(f.class_id)],  // colour is looked up by class id, so colors must cover every class_id present
+                      2);  // line thickness
+    }
+}
+
+const size_t DISP_WIDTH  = 1920;  // width of the composed output image
+const size_t DISP_HEIGHT = 1080;  // height of the composed output image
+const size_t MAX_INPUTS  = 25;  // capacity of DisplayParams::points
+
+struct DisplayParams {
+    std::string name;  // window name passed to cv::imshow
+    cv::Size windowSize;  // size of the whole composed image
+    cv::Size frameSize;  // size of the tile each source is resized to
+    size_t count;  // number of sources
+    cv::Point points[MAX_INPUTS];  // top-left corner of each source's tile
+};
+
+DisplayParams prepareDisplayParams(size_t count) {  // lays `count` sources out on a square grid inside the output window
+    DisplayParams params;
+    params.count = count;
+    params.windowSize = cv::Size(DISP_WIDTH, DISP_HEIGHT);
+    // Grid side is ceil(sqrt(count)), but at least 1 so that count == 0 cannot cause a division by zero below.
+    size_t gridCount = std::max<size_t>(1, static_cast<size_t>(ceil(sqrt(count))));
+    size_t gridStepX = static_cast<size_t>(DISP_WIDTH/gridCount);
+    size_t gridStepY = static_cast<size_t>(DISP_HEIGHT/gridCount);
+    params.frameSize = cv::Size(gridStepX, gridStepY);
+    // points[] has only MAX_INPUTS slots and the caller may validate count after this call, so never write past the array.
+    for (size_t i = 0; i < std::min(count, MAX_INPUTS); i++) {
+        cv::Point p;
+        p.x = gridStepX * (i/gridCount);  // tiles fill the grid column by column
+        p.y = gridStepY * (i%gridCount);
+        params.points[i] = p;
+    }
+    return params;
+}
+
+std::map<std::string, YoloParams> GetYoloParams(const std::vector<std::string>& outputDataBlobNames,
+                                                InferenceEngine::CNNNetwork &network) {
+    std::map<std::string, YoloParams> yoloParams;  // result, keyed by output layer name
+    // Every output must be a RegionYolo layer; its "mask" selects which anchor pairs that layer uses.
+    for (auto &output_name :outputDataBlobNames) {
+        InferenceEngine::CNNLayerPtr layer = network.getLayerByName(output_name.c_str());
+
+        if (layer->type != "RegionYolo")
+            throw std::runtime_error("Invalid output type: " + layer->type + ". RegionYolo expected");
+
+        auto num = layer->GetParamAsInt("num");  // superseded below by the number of masked anchors
+        auto coords = layer->GetParamAsInt("coords");
+        auto classes = layer->GetParamAsInt("classes");
+
+        std::vector<float> anchors = layer->GetParamAsFloats("anchors");
+
+        auto mask = layer->GetParamAsInts("mask");
+        num = static_cast<int>(mask.size());
+
+        std::vector<float> maskedAnchors(num * 2);
+        for (int i = 0; i < num; ++i) {
+            if (mask[i] < 0 || static_cast<size_t>(mask[i]) * 2 + 1 >= anchors.size())  // a bad mask must not read outside anchors
+                throw std::runtime_error("Invalid anchor mask in layer " + output_name);
+            maskedAnchors[i * 2] = anchors[mask[i] * 2];
+            maskedAnchors[i * 2 + 1] = anchors[mask[i] * 2 + 1];
+        }
+
+        yoloParams.emplace(output_name, YoloParams{num, classes, coords, maskedAnchors});  // like insert(): keeps the first entry per name
+    }
+
+    return yoloParams;
+}
+
+void displayNSources(const std::vector<std::shared_ptr<VideoFrame>>& data,  // one frame (with detections) per tile
+                     float time,  // used for the fps label: fps = 1000 / time
+                     const std::string& stats,  // newline-separated text, drawn only when -show_stats is set
+                     const DisplayParams& params,
+                     const std::vector<cv::Scalar> &colors,  // per-class colours passed to drawDetections
+                     Presenter& presenter) {
+    cv::Mat windowImage = cv::Mat::zeros(params.windowSize, CV_8UC3);  // black canvas the tiles are composed onto
+    auto loopBody = [&](size_t i) {
+        auto& elem = data[i];
+        if (!elem->frame.empty()) {
+            cv::Rect rectFrame = cv::Rect(params.points[i], params.frameSize);
+            cv::Mat windowPart = windowImage(rectFrame);  // view into the canvas, so resize/draw write into windowImage
+            cv::resize(elem->frame, windowPart, params.frameSize);
+            drawDetections(windowPart, elem->detections.get<std::vector<DetectionObject>>(), colors);
+        }
+    };
+    // Draws `stats` line by line, 25 px apart, starting in the lower-right part of the window.
+    auto drawStats = [&]() {
+        if (FLAGS_show_stats && !stats.empty()) {
+            static const cv::Point posPoint = cv::Point(3*DISP_WIDTH/4, 4*DISP_HEIGHT/5);
+            auto pos = posPoint + cv::Point(0, 25);
+            size_t currPos = 0;
+            while (true) {
+                auto newPos = stats.find('\n', currPos);
+                cv::putText(windowImage, stats.substr(currPos, newPos - currPos), pos, cv::HersheyFonts::FONT_HERSHEY_COMPLEX, 0.8,  cv::Scalar(0, 0, 255), 1);
+                if (newPos == std::string::npos) {  // last line has been drawn
+                    break;
+                }
+                pos += cv::Point(0, 25);
+                currPos = newPos + 1;
+            }
+        }
+    };
+
+//  #ifdef USE_TBB
+#if 0  // disable multithreaded rendering for now
+    run_in_arena([&](){
+        tbb::parallel_for<size_t>(0, data.size(), [&](size_t i) {
+            loopBody(i);
+        });
+    });
+#else
+    for (size_t i = 0; i < data.size(); ++i) {  // sequential rendering: the only path compiled at present
+        loopBody(i);
+    }
+#endif
+    presenter.drawGraphs(windowImage);
+    drawStats();
+    // The fps label is drawn last, on top of the tiles, graphs and statistics.
+    char str[256];
+    snprintf(str, sizeof(str), "%5.2f fps", static_cast<double>(1000.0f/time));
+    cv::putText(windowImage, str, cv::Point(800, 100), cv::HersheyFonts::FONT_HERSHEY_COMPLEX, 2.0,  cv::Scalar(0, 255, 0), 2);
+    cv::imshow(params.name, windowImage);
+}
+
+}  // namespace
+
+int main(int argc, char* argv[]) {
+    try {
+#if USE_TBB
+        TbbArenaWrapper arena;
+#endif
+
+        slog::info << "InferenceEngine: " << InferenceEngine::GetInferenceEngineVersion() << slog::endl;
+
+        // ------------------------------ Parsing and validation of input args ---------------------------------
+        if (!ParseAndCheckCommandLine(argc, argv)) {
+            return 0;
+        }
+
+        std::string modelPath = FLAGS_m;
+        std::size_t found = modelPath.find_last_of(".");
+        if (found > modelPath.size()) {
+            slog::info << "Invalid model name: " << modelPath << slog::endl;
+            slog::info << "Expected to be <model_name>.xml" << slog::endl;
+            return -1;
+        }
+        slog::info << "Model   path: " << modelPath << slog::endl;
+
+        std::map<std::string, YoloParams> yoloParams;
+
+        IEGraph::InitParams graphParams;
+        graphParams.batchSize       = FLAGS_bs;
+        graphParams.maxRequests     = FLAGS_nireq;
+        graphParams.collectStats    = FLAGS_show_stats;
+        graphParams.reportPerf      = FLAGS_pc;
+        graphParams.modelPath       = modelPath;
+        graphParams.cpuExtPath      = FLAGS_l;
+        graphParams.cldnnConfigPath = FLAGS_c;
+        graphParams.deviceName      = FLAGS_d;
+        graphParams.postLoadFunc    = [&yoloParams](const std::vector<std::string>& outputDataBlobNames,
+                                                    InferenceEngine::CNNNetwork &network) {
+                                                        yoloParams = GetYoloParams(outputDataBlobNames, network);
+                                                    };
+
+        std::shared_ptr<IEGraph> network(new IEGraph(graphParams));
+        auto inputDims = network->getInputDims();
+        if (4 != inputDims.size()) {
+            throw std::runtime_error("Invalid network input dimensions");
+        }
+
+        std::vector<std::string> files;
+        parseInputFilesArguments(files);
+
+        slog::info << "\tNumber of input web cams:    " << FLAGS_nc << slog::endl;
+        slog::info << "\tNumber of input video files: " << files.size() << slog::endl;
+        slog::info << "\tDuplication multiplayer:     " << FLAGS_duplicate_num << slog::endl;
+
+        const auto duplicateFactor = (1 + FLAGS_duplicate_num);
+        size_t numberOfInputs = (FLAGS_nc + files.size()) * duplicateFactor;
+
+        DisplayParams params = prepareDisplayParams(numberOfInputs);
+
+        slog::info << "\tNumber of input channels:    " << numberOfInputs << slog::endl;
+        if (numberOfInputs > MAX_INPUTS) {
+            throw std::logic_error("Number of inputs exceed maximum value [25]");
+        }
+
+        VideoSources::InitParams vsParams;
+        vsParams.queueSize            = FLAGS_n_iqs;
+        vsParams.collectStats         = FLAGS_show_stats;
+        vsParams.realFps              = FLAGS_real_input_fps;
+        vsParams.expectedHeight = static_cast<unsigned>(inputDims[2]);
+        vsParams.expectedWidth  = static_cast<unsigned>(inputDims[3]);
+
+        VideoSources sources(vsParams);
+        if (!files.empty()) {
+            slog::info << "Trying to open input video ..." << slog::endl;
+            for (auto& file : files) {
+                try {
+                    sources.openVideo(file, false);
+                } catch (...) {
+                    slog::info << "Cannot open video [" << file << "]" << slog::endl;
+                    throw;
+                }
+            }
+        }
+        if (FLAGS_nc) {
+            slog::info << "Trying to connect " << FLAGS_nc << " web cams ..." << slog::endl;
+            for (size_t i = 0; i < FLAGS_nc; ++i) {
+                try {
+                    sources.openVideo(std::to_string(i), true);
+                } catch (...) {
+                    slog::info << "Cannot open web cam [" << i << "]" << slog::endl;
+                    throw;
+                }
+            }
+        }
+        sources.start();
+
+        size_t currentFrame = 0;
+
+        std::vector<cv::Scalar> colors;
+        if (yoloParams.size() > 0)
+            for (int i = 0; i < static_cast<int>(yoloParams.begin()->second.classes); ++i)
+                colors.push_back(cv::Scalar(rand() % 256, rand() % 256, rand() % 256));
+
+        network->start([&](VideoFrame& img) {
+            img.sourceIdx = currentFrame;
+            auto camIdx = currentFrame / duplicateFactor;
+            currentFrame = (currentFrame + 1) % numberOfInputs;
+            return sources.getFrame(camIdx, img);
+        }, [&yoloParams](InferenceEngine::InferRequest::Ptr req,
+                const std::vector<std::string>& outputDataBlobNames,
+                cv::Size frameSize
+                ) {
+            unsigned long resized_im_h = 416;
+            unsigned long resized_im_w = 416;
+
+            std::vector<DetectionObject> objects;
+            // Parsing outputs
+            for (auto &output_name :outputDataBlobNames) {
+                ParseYOLOV3Output(req, output_name, yoloParams[output_name], resized_im_h, resized_im_w, frameSize.height, frameSize.width, FLAGS_t, objects);
+            }
+            // Filtering out overlapping boxes and low-confidence objects
+            std::sort(objects.begin(), objects.end(), std::greater<DetectionObject>());
+            for (size_t i = 0; i < objects.size(); ++i) {
+                if (objects[i].confidence == 0)
+                    continue;
+                for (size_t j = i + 1; j < objects.size(); ++j)
+                    if (IntersectionOverUnion(objects[i], objects[j]) >= 0.4)
+                        objects[j].confidence = 0;
+            }
+
+            std::vector<Detections> detections(1);
+            detections[0].set(new std::vector<DetectionObject>);
+
+            for (auto &object : objects) {
+                if (object.confidence < FLAGS_t)
+                    continue;
+                detections[0].get<std::vector<DetectionObject>>().push_back(object);
+            }
+
+            return detections;
+        });
+
+        network->setDetectionConfidence(static_cast<float>(FLAGS_t));
+
+        std::atomic<float> averageFps = {0.0f};
+
+        std::vector<std::shared_ptr<VideoFrame>> batchRes;
+
+        std::mutex statMutex;
+        std::stringstream statStream;
+
+        std::cout << "To close the application, press 'CTRL+C' here";
+        if (!FLAGS_no_show) {
+            std::cout << " or switch to the output window and press ESC key";
+        }
+        std::cout << std::endl;
+
+        cv::Size graphSize{static_cast<int>(params.windowSize.width / 4), 60};
+        Presenter presenter(FLAGS_u, params.windowSize.height - graphSize.height - 10, graphSize);
+
+        const size_t outputQueueSize = 1;
+        AsyncOutput output(FLAGS_show_stats, outputQueueSize,
+        [&](const std::vector<std::shared_ptr<VideoFrame>>& result) {
+            std::string str;
+            if (FLAGS_show_stats) {
+                std::unique_lock<std::mutex> lock(statMutex);
+                str = statStream.str();
+            }
+            displayNSources(result, averageFps, str, params, colors, presenter);
+            int key = cv::waitKey(1);
+            presenter.handleKey(key);
+
+            return (key != 27);
+        });
+
+        output.start();
+
+        using timer = std::chrono::high_resolution_clock;
+        using duration = std::chrono::duration<float, std::milli>;
+        timer::time_point lastTime = timer::now();
+        duration samplingTimeout(FLAGS_fps_sp);
+
+        size_t fpsCounter = 0;
+
+        size_t perfItersCounter = 0;
+
+        while (sources.isRunning() || network->isRunning()) {
+            bool readData = true;
+            while (readData) {
+                auto br = network->getBatchData(params.frameSize);
+                if (br.empty()) {
+                    break;
+                }
+                for (size_t i = 0; i < br.size(); i++) {
+                    auto val = static_cast<unsigned int>(br[i]->sourceIdx);
+                    auto it = find_if(batchRes.begin(), batchRes.end(), [val] (const std::shared_ptr<VideoFrame>& vf) { return vf->sourceIdx == val; } );
+                    if (it != batchRes.end()) {
+                        if (!FLAGS_no_show) {
+                            output.push(std::move(batchRes));
+                        }
+                        batchRes.clear();
+                        readData = false;
+                    }
+                    batchRes.push_back(std::move(br[i]));
+                }
+            }
+            ++fpsCounter;
+
+            if (!output.isAlive()) {
+                break;
+            }
+
+            auto currTime = timer::now();
+            auto deltaTime = (currTime - lastTime);
+            if (deltaTime >= samplingTimeout) {
+                auto durMsec =
+                        std::chrono::duration_cast<duration>(deltaTime).count();
+                auto frameTime = durMsec / static_cast<float>(fpsCounter);
+                fpsCounter = 0;
+                lastTime = currTime;
+
+                if (FLAGS_no_show) {
+                    slog::info << "Average Throughput : " << 1000.f/frameTime << " fps" << slog::endl;
+                    if (++perfItersCounter >= FLAGS_n_sp) {
+                        break;
+                    }
+                } else {
+                    averageFps = frameTime;
+                }
+
+                if (FLAGS_show_stats) {
+                    auto inputStat = sources.getStats();
+                    auto inferStat = network->getStats();
+                    auto outputStat = output.getStats();
+
+                    std::unique_lock<std::mutex> lock(statMutex);
+                    statStream.str(std::string());
+                    statStream << std::fixed << std::setprecision(1);
+                    statStream << "Input reads: ";
+                    for (size_t i = 0; i < inputStat.readTimes.size(); ++i) {
+                        if (0 == (i % 4)) {
+                            statStream << std::endl;
+                        }
+                        statStream << inputStat.readTimes[i] << "ms ";
+                    }
+                    statStream << std::endl;
+                    statStream << "HW decoding latency: "
+                               << inputStat.decodingLatency << "ms";
+                    statStream << std::endl;
+                    statStream << "Preprocess time: "
+                               << inferStat.preprocessTime << "ms";
+                    statStream << std::endl;
+                    statStream << "Plugin latency: "
+                               << inferStat.inferTime << "ms";
+                    statStream << std::endl;
+
+                    statStream << "Render time: " << outputStat.renderTime
+                               << "ms" << std::endl;
+
+                    if (FLAGS_no_show) {
+                        slog::info << statStream.str() << slog::endl;
+                    }
+                }
+            }
+        }
+
+        network.reset();
+
+        std::cout << presenter.reportMeans() << '\n';
+    }
+    catch (const std::exception& error) {
+        slog::err << error.what() << slog::endl;
+        return 1;
+    }
+    catch (...) {
+        slog::err << "Unknown/internal exception happened." << slog::endl;
+        return 1;
+    }
+
+    slog::info << "Execution successful" << slog::endl;
+    return 0;
+}
diff --git a/demos/multi_channel/object_detection_demo_yolov3/multichannel_object_detection_demo_yolov3_params.hpp b/demos/multi_channel/object_detection_demo_yolov3/multichannel_object_detection_demo_yolov3_params.hpp
new file mode 100644
index 00000000000..b4ef8ee7ec2
--- /dev/null
+++ b/demos/multi_channel/object_detection_demo_yolov3/multichannel_object_detection_demo_yolov3_params.hpp
@@ -0,0 +1,13 @@
+// Copyright (C) 2018-2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#pragma once
+
+#include <string>
+#include <vector>
+#include <gflags/gflags.h>
+
+static const char thresh_output_message[] = "Optional. Probability threshold for detections";  // help text attached to the -t flag defined below
+
+DEFINE_double(t, 0.5, thresh_output_message);  // gflags double flag "-t", default 0.5; read elsewhere as FLAGS_t
diff --git a/demos/multichannel_demo/README.md b/demos/multichannel_demo/README.md
deleted file mode 100644
index 90176bc9499..00000000000
--- a/demos/multichannel_demo/README.md
+++ /dev/null
@@ -1,5 +0,0 @@
-# Multi-Channel C++ Demos
-
-The demos provide an inference pipeline for two multi-channel scenarios: face detection and human pose estimation. For more information, refer to the corresponding pages:
-* [Multi-Channel Face Detection C++ Demo](./fd/README.md)
-* [Multi-Channel Human Pose Estimation C++ Demo](./hpe/README.md)
diff --git a/demos/multichannel_demo/common/multichannel_params.hpp b/demos/multichannel_demo/common/multichannel_params.hpp
deleted file mode 100644
index f3a24ca8d5c..00000000000
--- a/demos/multichannel_demo/common/multichannel_params.hpp
+++ /dev/null
@@ -1,129 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-#pragma once
-
-#include <string>
-#include <vector>
-#include <gflags/gflags.h>
-
-/// @brief Message for help argument
-static const char help_message[] = "Print a usage message";
-
-/// @brief Message for model argument
-static const char face_detection_model_message[] = "Required. Path to an .xml file with a trained model.";
-
-/// @brief Message for assigning face detection calculation to a device
-static const char target_device_message[] = "Optional. Specify the target device for a network (the list of available devices is shown below). " \
-"Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo looks for a suitable plugin for a specified device.";
-
-/// @brief Message for performance counters
-static const char performance_counter_message[] = "Optional. Enable per-layer performance report";
-
-/// @brief Message for GPU custom kernels descriptions
-static const char custom_cldnn_message[] = "Required for GPU custom kernels. "\
-"Absolute path to an .xml file with the kernels descriptions";
-
-/// @brief Message for user library argument
-static const char custom_cpu_library_message[] = "Required for CPU custom layers. " \
-"Absolute path to a shared library with the kernels implementations";
-
-/// @brief Message for not showing a processed video
-static const char no_show_processed_video[] = "Optional. Do not show processed video.";
-
-/// @brief Message for the number of camera inputs
-static const char num_cameras[] = "Optional. Maximum number of processed camera inputs (web cameras)";
-
-/// @brief Message for batch size
-static const char batch_size[] = "Optional. Batch size for processing (the number of frames processed per infer request)";
-
-/// @brief Message for the number of infer requests
-static const char num_infer_requests[] = "Optional. Number of infer requests";
-
-/// @brief Message for inputs queue size
-static const char input_queue_size[] = "Optional. Frame queue size for input channels";
-
-/// @brief Message for FPS measurement sampling period
-static const char fps_sampling_period[] = "Optional. FPS measurement sampling period between timepoints in msec";
-
-/// @brief Message for the number of sampling periods
-static const char num_sampling_periods[] = "Optional. Number of sampling periods";
-
-/// @brief Message for enabling statistics output
-static const char show_statistics[] = "Optional. Enable statistics report";
-
-/// @brief Message for enabling channel duplication
-static const char duplication_channel_number[] = "Optional. Enable and specify the number of channels additionally copied from real sources";
-
-/// @brief Message for enabling real input FPS
-static const char real_input_fps[] = "Optional. Disable input frames caching, for maximum throughput pipeline";
-
-/// @brief Message for enabling input video
-static const char input_video[] = "Optional. Specify full path to input video files";
-
-/// \brief Define a flag for showing help message <br>
-DEFINE_bool(h, false, help_message);
-
-/// \brief Define a parameter for a model file <br>
-/// It is a required parameter
-DEFINE_string(m, "", face_detection_model_message);
-
-/// \brief Define a target device parameter for a model <br>
-DEFINE_string(d, "CPU", target_device_message);
-
-/// \brief Define a flag to enable per-layer performance report <br>
-DEFINE_bool(pc, false, performance_counter_message);
-
-/// @brief GPU custom kernels path <br>
-/// Default is ./lib
-DEFINE_string(c, "", custom_cldnn_message);
-
-/// @brief Absolute path to CPU library with user layers <br>
-/// It is a optional parameter
-DEFINE_string(l, "", custom_cpu_library_message);
-
-/// \brief Flag to disable showing processed video<br>
-/// It is an optional parameter
-DEFINE_bool(no_show, false, no_show_processed_video);
-
-/// \brief Flag to specify the number of expected input channels<br>
-/// It is an optional parameter
-DEFINE_uint32(nc, 0, num_cameras);
-
-/// \brief Flag to specify batch size<br>
-/// It is an optional parameter
-DEFINE_uint32(bs, 1, batch_size);
-
-/// \brief Flag to specify the number of infer requests<br>
-/// It is an optional parameter
-DEFINE_uint32(nireq, 5, num_infer_requests);
-
-/// \brief Flag to specify the number of expected input channels<br>
-/// It is an optional parameter
-DEFINE_uint32(n_iqs, 5, input_queue_size);
-
-/// \brief Flag to specify FPS measurement sampling period<br>
-/// It is an optional parameter
-DEFINE_uint32(fps_sp, 1000, fps_sampling_period);
-
-/// \brief Flag to specify the number of sampling periods<br>
-/// It is an optional parameter
-DEFINE_uint32(n_sp, 10, num_sampling_periods);
-
-/// \brief Flag to enable statisics output<br>
-/// It is an optional parameter
-DEFINE_bool(show_stats, false, show_statistics);
-
-/// \brief Flag to enable and specify the number of channels additionally copied from real sources<br>
-/// It is an optional parameter
-DEFINE_uint32(duplicate_num, 0, duplication_channel_number);
-
-/// \brief Flag to enable real input FPS<br>
-/// It is an optional parameter
-DEFINE_bool(real_input_fps, false, real_input_fps);
-
-/// \brief Define parameter for input video files <br>
-/// It is a optional parameter
-DEFINE_string(i, "", input_video);
diff --git a/demos/object_detection_demo_faster_rcnn/CMakeLists.txt b/demos/object_detection_demo_faster_rcnn/CMakeLists.txt
index ad5aded67d6..04eb26e8867 100644
--- a/demos/object_detection_demo_faster_rcnn/CMakeLists.txt
+++ b/demos/object_detection_demo_faster_rcnn/CMakeLists.txt
@@ -6,4 +6,4 @@ ie_add_sample(NAME object_detection_demo_faster_rcnn
               SOURCES "${CMAKE_CURRENT_SOURCE_DIR}/main.cpp"
               HEADERS "${CMAKE_CURRENT_SOURCE_DIR}/object_detection_demo_faster_rcnn.h"
                       "${CMAKE_CURRENT_SOURCE_DIR}/detectionoutput.h"
-              DEPENDENCIES format_reader)
+              OPENCV_DEPENDENCIES core imgcodecs imgproc)
diff --git a/demos/object_detection_demo_faster_rcnn/README.md b/demos/object_detection_demo_faster_rcnn/README.md
index b62201c0680..b0ae3df0ce5 100644
--- a/demos/object_detection_demo_faster_rcnn/README.md
+++ b/demos/object_detection_demo_faster_rcnn/README.md
@@ -29,7 +29,7 @@ output image and outputs data to the standard output stream.
 ## Running
 
 Running the application with the `-h` option yields the following usage message:
-```sh
+```
 ./object_detection_demo_faster_rcnn -h
 InferenceEngine:
     API version ............ <version>
diff --git a/demos/object_detection_demo_faster_rcnn/detectionoutput.h b/demos/object_detection_demo_faster_rcnn/detectionoutput.h
index eef03fe6fbb..074480c44f2 100644
--- a/demos/object_detection_demo_faster_rcnn/detectionoutput.h
+++ b/demos/object_detection_demo_faster_rcnn/detectionoutput.h
@@ -9,6 +9,8 @@
 #include <utility>
 #include <algorithm>
 
+#include <inference_engine.hpp>
+
 using namespace InferenceEngine;
 using InferenceEngine::details::InferenceEngineException;
 
@@ -24,90 +26,63 @@ static bool SortScorePairDescend(const std::pair<float, T>& pair1,
  * In our demo we use it as a post-processing class for Faster-RCNN networks
  */
 class DetectionOutputPostProcessor {
-    CNNLayer cnnLayer;
-
 public:
-    explicit DetectionOutputPostProcessor(const CNNLayer* layer): cnnLayer(*layer) {
+    explicit DetectionOutputPostProcessor(const SizeVector &image_dims,
+                                          const SizeVector &loc_dims,
+                                          const SizeVector &conf_dims,
+                                          const SizeVector &prior_dims) {
         try {
-            if (cnnLayer.insData.size() != 3)
-                THROW_IE_EXCEPTION << "Incorrect number of input edges for layer " << cnnLayer.name;
-            if (cnnLayer.outData.empty())
-                THROW_IE_EXCEPTION << "Incorrect number of output edges for layer " << cnnLayer.name;
-
-            _num_classes = cnnLayer.GetParamAsInt("num_classes");
-            _background_label_id = cnnLayer.GetParamAsInt("background_label_id", 0);
-            _top_k = cnnLayer.GetParamAsInt("top_k", -1);
-            _variance_encoded_in_target = cnnLayer.GetParamAsBool("variance_encoded_in_target", false);
-            _keep_top_k = cnnLayer.GetParamAsInt("keep_top_k", -1);
-            _nms_threshold = cnnLayer.GetParamAsFloat("nms_threshold");
-            _confidence_threshold = cnnLayer.GetParamAsFloat("confidence_threshold", -FLT_MAX);
-            _share_location = cnnLayer.GetParamAsBool("share_location", true);
-            _normalized = cnnLayer.GetParamAsBool("normalized", true);
-            _image_height = cnnLayer.GetParamAsInt("input_height", 1);
-            _image_width = cnnLayer.GetParamAsInt("input_width", 1);
-            _prior_size = _normalized ? 4 : 5;
-            _offset = _normalized ? 0 : 1;
-            _num_loc_classes = _share_location ? 1 : _num_classes;
-
-            std::string code_type_str = cnnLayer.GetParamAsString("code_type", "caffe.PriorBoxParameter.CORNER");
-            _code_type = (code_type_str == "caffe.PriorBoxParameter.CENTER_SIZE" ? CodeType::CENTER_SIZE
-                                                                                 : CodeType::CORNER);
-
-            auto prior_ptr = cnnLayer.insData[idx_priors].lock();
-            if (!prior_ptr) {
-                THROW_IE_EXCEPTION << "Pointer to the input data of layer " << cnnLayer.name << " is exprired";
-            }
-            auto prior_dims = prior_ptr->getTensorDesc().getDims();
+            IE_ASSERT(4 == image_dims.size());
+
+            _image_height = image_dims[2];
+            _image_width = image_dims[3];
+
             IE_ASSERT(2 <=  prior_dims.size());
             int priors_size = prior_dims[prior_dims.size() - 2] * prior_dims[prior_dims.size() - 1];
 
-            auto loc_ptr = cnnLayer.insData[idx_location].lock();
-            if (!loc_ptr) {
-                THROW_IE_EXCEPTION << "Pointer to the input data of layer " << cnnLayer.name << " is exprired";
-            }
-            auto loc_dims = loc_ptr->getTensorDesc().getDims();
             IE_ASSERT(2 <= loc_dims.size());
             int loc_size = loc_dims[loc_dims.size() - 2]*loc_dims[loc_dims.size() - 1];
 
-            auto conf_ptr = cnnLayer.insData[idx_confidence].lock();
-            if (!conf_ptr) {
-                THROW_IE_EXCEPTION << "Pointer to the input data of layer " << cnnLayer.name << " is exprired";
-            }
-            auto conf_dims = conf_ptr->getTensorDesc().getDims();
             IE_ASSERT(2 <= conf_dims.size());
-            uint32_t conf_size = conf_dims[0]*conf_dims[1];
+            size_t conf_size = conf_dims[0]*conf_dims[1];
 
             _num_priors = static_cast<int>(priors_size / _prior_size);
 
+            // num_classes guessed from the output dims
+            if (loc_size % (_num_priors * 4) != 0) {
+                throw std::runtime_error("Can't guess number of classes. Something's wrong with output layers dims");
+            }
+
+            _num_classes = loc_size / (_num_priors * 4);
+            _num_loc_classes = _num_classes;
+
             if (_num_priors * _num_loc_classes * 4 != loc_size)
                 THROW_IE_EXCEPTION << "Number of priors must match number of location predictions.";
 
             if (_num_priors * _num_classes != static_cast<int>(conf_size))
                 THROW_IE_EXCEPTION << "Number of priors must match number of confidence predictions.";
 
-            _num = static_cast<int>(conf_size);
-
-            SizeVector bboxes_size{static_cast<size_t>(_num),
+            SizeVector bboxes_size{conf_size,
                                                     static_cast<size_t>(_num_classes),
                                                     static_cast<size_t>(_num_priors),
                                                     4};
             _decoded_bboxes = make_shared_blob<float>({Precision::FP32, bboxes_size, NCHW});
             _decoded_bboxes->allocate();
 
-            SizeVector buf_size{static_cast<size_t>(_num),
+            SizeVector buf_size{conf_size,
                                                  static_cast<size_t>(_num_classes),
                                                  static_cast<size_t>(_num_priors)};
             _buffer = make_shared_blob<int>({Precision::I32, buf_size, {buf_size, {0, 1, 2}}});
             _buffer->allocate();
 
-            SizeVector indices_size{static_cast<size_t>(_num),
+            SizeVector indices_size{conf_size,
                                                      static_cast<size_t>(_num_classes),
                                                      static_cast<size_t>(_num_priors)};
             _indices = make_shared_blob<int>(
                     {Precision::I32, indices_size, {indices_size, {0, 1, 2}}});
             _indices->allocate();
 
-            SizeVector detections_size{static_cast<size_t>(_num * _num_classes)};
+            SizeVector detections_size{conf_size * static_cast<size_t>(_num_classes)};
             _detections_count = make_shared_blob<int>({Precision::I32, detections_size, C});
             _detections_count->allocate();
 
@@ -115,14 +90,14 @@ class DetectionOutputPostProcessor {
             _reordered_conf = make_shared_blob<float>({Precision::FP32, conf_size1, ANY});
             _reordered_conf->allocate();
 
-            SizeVector decoded_bboxes_size{static_cast<size_t>(_num),
+            SizeVector decoded_bboxes_size{conf_size,
                                                             static_cast<size_t>(_num_priors),
                                                             static_cast<size_t>(_num_classes)};
             _bbox_sizes = make_shared_blob<float>(
                     {Precision::FP32, decoded_bboxes_size, {decoded_bboxes_size, {0, 1, 2}}});
             _bbox_sizes->allocate();
 
-            SizeVector num_priors_actual_size{static_cast<size_t>(_num)};
+            SizeVector num_priors_actual_size{conf_size};
             _num_priors_actual = make_shared_blob<int>({Precision::I32, num_priors_actual_size, C});
             _num_priors_actual->allocate();
         } catch (const InferenceEngineException& ex) {
@@ -152,22 +127,15 @@ class DetectionOutputPostProcessor {
         const float *ppriors = prior_data;
 
         for (int n = 0; n < N; ++n) {
-            if (_share_location) {
-                const float *ploc = loc_data + n*4*_num_priors;
-                float *pboxes = decoded_bboxes_data + n*4*_num_priors;
-                float *psizes = bbox_sizes_data + n*_num_priors;
-                decodeBBoxes(ppriors, ploc, prior_variances, pboxes, psizes, num_priors_actual, n);
-            } else {
-                for (int c = 0; c < _num_loc_classes; ++c) {
-                    if (c == _background_label_id) {
-                        continue;
-                    }
-
-                    const float *ploc = loc_data + n*4*_num_loc_classes*_num_priors + c*4;
-                    float *pboxes = decoded_bboxes_data + n*4*_num_loc_classes*_num_priors + c*4*_num_priors;
-                    float *psizes = bbox_sizes_data + n*_num_loc_classes*_num_priors + c*_num_priors;
-                    decodeBBoxes(ppriors, ploc, prior_variances, pboxes, psizes, num_priors_actual, n);
+            for (int c = 0; c < _num_loc_classes; ++c) {
+                if (c == _background_label_id) {
+                    continue;
                 }
+
+                const float *ploc = loc_data + n*4*_num_loc_classes*_num_priors + c*4;
+                float *pboxes = decoded_bboxes_data + n*4*_num_loc_classes*_num_priors + c*4*_num_priors;
+                float *psizes = bbox_sizes_data + n*_num_loc_classes*_num_priors + c*_num_priors;
+                decodeBBoxes(ppriors, ploc, prior_variances, pboxes, psizes, num_priors_actual, n);
             }
         }
 
@@ -195,15 +163,8 @@ class DetectionOutputPostProcessor {
                 int *pdetections = detections_data + n*_num_classes + c;
 
                 const float *pconf = reordered_conf_data + n*_num_classes*_num_priors + c*_num_priors;
-                const float *pboxes;
-                const float *psizes;
-                if (_share_location) {
-                    pboxes = decoded_bboxes_data + n*4*_num_priors;
-                    psizes = bbox_sizes_data + n*_num_priors;
-                } else {
-                    pboxes = decoded_bboxes_data + n*4*_num_classes*_num_priors + c*4*_num_priors;
-                    psizes = bbox_sizes_data + n*_num_classes*_num_priors + c*_num_priors;
-                }
+                const float *pboxes = decoded_bboxes_data + n*4*_num_classes*_num_priors + c*4*_num_priors;
+                const float *psizes = bbox_sizes_data + n*_num_classes*_num_priors + c*_num_priors;
 
                 nms(pconf, pboxes, psizes, pbuffer, pindices, *pdetections, num_priors_actual[n]);
             }
@@ -270,14 +231,10 @@ class DetectionOutputPostProcessor {
                     dst_data[count * DETECTION_SIZE + 1] = static_cast<float>(c);
                     dst_data[count * DETECTION_SIZE + 2] = pconf[c*_num_priors + idx];
 
-                    float xmin = _share_location ? pboxes[idx*4 + 0] :
-                                 pboxes[c*4*_num_priors + idx*4 + 0];
-                    float ymin = _share_location ? pboxes[idx*4 + 1] :
-                                 pboxes[c*4*_num_priors + idx*4 + 1];
-                    float xmax = _share_location ? pboxes[idx*4 + 2] :
-                                 pboxes[c*4*_num_priors + idx*4 + 2];
-                    float ymax = _share_location ? pboxes[idx*4 + 3] :
-                                 pboxes[c*4*_num_priors + idx*4 + 3];
+                    float xmin = pboxes[c*4*_num_priors + idx*4 + 0];
+                    float ymin = pboxes[c*4*_num_priors + idx*4 + 1];
+                    float xmax = pboxes[c*4*_num_priors + idx*4 + 2];
+                    float ymax = pboxes[c*4*_num_priors + idx*4 + 3];
 
                     dst_data[count * DETECTION_SIZE + 3] = xmin;
                     dst_data[count * DETECTION_SIZE + 4] = ymin;
@@ -304,32 +261,21 @@ class DetectionOutputPostProcessor {
 
 
     int _num_classes = 0;
-    int _background_label_id = 0;
-    int _top_k = 0;
-    int _variance_encoded_in_target = 0;
-    int _keep_top_k = 0;
-    int _code_type = 0;
-
-    bool _share_location = false;
+    const int _background_label_id = 0;
+    const int _top_k = 400;
+    const int _keep_top_k = 200;
 
     int _image_width = 0;
     int _image_height = 0;
-    int _prior_size = 4;
-    bool _normalized = true;
-    int _offset = 0;
+    const int _prior_size = 5;
+    const int _offset = 1;
 
-    float _nms_threshold = 0.0f;
-    float _confidence_threshold = 0.0f;
+    const float _nms_threshold = 0.3f;
+    const float _confidence_threshold = -FLT_MAX;
 
-    int _num = 0;
     int _num_loc_classes = 0;
     int _num_priors = 0;
 
-    enum CodeType {
-        CORNER = 1,
-        CENTER_SIZE = 2,
-    };
-
     void decodeBBoxes(const float *prior_data, const float *loc_data, const float *variance_data,
                       float *decoded_bboxes, float *decoded_bbox_sizes, int* num_priors_actual, int n);
 
@@ -402,23 +348,16 @@ void DetectionOutputPostProcessor::decodeBBoxes(const float *prior_data,
                                    int* num_priors_actual,
                                    int n) {
     num_priors_actual[n] = _num_priors;
-    if (!_normalized) {
-        int num = 0;
-        for (; num < _num_priors; ++num) {
-            float batch_id = prior_data[num * _prior_size + 0];
-            if (batch_id == -1.f) {
-                num_priors_actual[n] = num;
-                break;
-            }
+
+    for (int num = 0; num < _num_priors; ++num) {
+        float batch_id = prior_data[num * _prior_size + 0];
+        if (batch_id == -1.f) {
+            num_priors_actual[n] = num;
+            break;
         }
     }
 
     for (int p = 0; p < num_priors_actual[n]; ++p) {
-        float new_xmin = 0.0f;
-        float new_ymin = 0.0f;
-        float new_xmax = 0.0f;
-        float new_ymax = 0.0f;
-
         float prior_xmin = prior_data[p*_prior_size + 0 + _offset];
         float prior_ymin = prior_data[p*_prior_size + 1 + _offset];
         float prior_xmax = prior_data[p*_prior_size + 2 + _offset];
@@ -429,54 +368,29 @@ void DetectionOutputPostProcessor::decodeBBoxes(const float *prior_data,
         float loc_xmax = loc_data[4*p*_num_loc_classes + 2];
         float loc_ymax = loc_data[4*p*_num_loc_classes + 3];
 
-        if (!_normalized) {
-            prior_xmin /= _image_width;
-            prior_ymin /= _image_height;
-            prior_xmax /= _image_width;
-            prior_ymax /= _image_height;
-        }
-
-        if (_code_type == CodeType::CORNER) {
-            if (_variance_encoded_in_target) {
-                // variance is encoded in target, we simply need to add the offset predictions.
-                new_xmin = prior_xmin + loc_xmin;
-                new_ymin = prior_ymin + loc_ymin;
-                new_xmax = prior_xmax + loc_xmax;
-                new_ymax = prior_ymax + loc_ymax;
-            } else {
-                new_xmin = prior_xmin + variance_data[p*4 + 0] * loc_xmin;
-                new_ymin = prior_ymin + variance_data[p*4 + 1] * loc_ymin;
-                new_xmax = prior_xmax + variance_data[p*4 + 2] * loc_xmax;
-                new_ymax = prior_ymax + variance_data[p*4 + 3] * loc_ymax;
-            }
-        } else if (_code_type == CodeType::CENTER_SIZE) {
-            float prior_width    =  prior_xmax - prior_xmin;
-            float prior_height   =  prior_ymax - prior_ymin;
-            float prior_center_x = (prior_xmin + prior_xmax) / 2.0f;
-            float prior_center_y = (prior_ymin + prior_ymax) / 2.0f;
-
-            float decode_bbox_center_x, decode_bbox_center_y;
-            float decode_bbox_width, decode_bbox_height;
-
-            if (_variance_encoded_in_target) {
-                // variance is encoded in target, we simply need to restore the offset predictions.
-                decode_bbox_center_x = loc_xmin * prior_width  + prior_center_x;
-                decode_bbox_center_y = loc_ymin * prior_height + prior_center_y;
-                decode_bbox_width  = std::exp(loc_xmax) * prior_width;
-                decode_bbox_height = std::exp(loc_ymax) * prior_height;
-            } else {
-                // variance is encoded in bbox, we need to scale the offset accordingly.
-                decode_bbox_center_x = variance_data[p*4 + 0] * loc_xmin * prior_width + prior_center_x;
-                decode_bbox_center_y = variance_data[p*4 + 1] * loc_ymin * prior_height + prior_center_y;
-                decode_bbox_width    = std::exp(variance_data[p*4 + 2] * loc_xmax) * prior_width;
-                decode_bbox_height   = std::exp(variance_data[p*4 + 3] * loc_ymax) * prior_height;
-            }
-
-            new_xmin = decode_bbox_center_x - decode_bbox_width  / 2.0f;
-            new_ymin = decode_bbox_center_y - decode_bbox_height / 2.0f;
-            new_xmax = decode_bbox_center_x + decode_bbox_width  / 2.0f;
-            new_ymax = decode_bbox_center_y + decode_bbox_height / 2.0f;
-        }
+        prior_xmin /= _image_width;
+        prior_ymin /= _image_height;
+        prior_xmax /= _image_width;
+        prior_ymax /= _image_height;
+
+        float prior_width    =  prior_xmax - prior_xmin;
+        float prior_height   =  prior_ymax - prior_ymin;
+        float prior_center_x = (prior_xmin + prior_xmax) / 2.0f;
+        float prior_center_y = (prior_ymin + prior_ymax) / 2.0f;
+
+        float decode_bbox_center_x, decode_bbox_center_y;
+        float decode_bbox_width, decode_bbox_height;
+
+        // variance is encoded in target, we simply need to restore the offset predictions.
+        decode_bbox_center_x = loc_xmin * prior_width  + prior_center_x;
+        decode_bbox_center_y = loc_ymin * prior_height + prior_center_y;
+        decode_bbox_width  = std::exp(loc_xmax) * prior_width;
+        decode_bbox_height = std::exp(loc_ymax) * prior_height;
+
+        float new_xmin = decode_bbox_center_x - decode_bbox_width  / 2.0f;
+        float new_ymin = decode_bbox_center_y - decode_bbox_height / 2.0f;
+        float new_xmax = decode_bbox_center_x + decode_bbox_width  / 2.0f;
+        float new_ymax = decode_bbox_center_y + decode_bbox_height / 2.0f;
 
         decoded_bboxes[p*4 + 0] = new_xmin;
         decoded_bboxes[p*4 + 1] = new_ymin;
diff --git a/demos/object_detection_demo_faster_rcnn/main.cpp b/demos/object_detection_demo_faster_rcnn/main.cpp
index cbc444f2502..b5db5203c09 100644
--- a/demos/object_detection_demo_faster_rcnn/main.cpp
+++ b/demos/object_detection_demo_faster_rcnn/main.cpp
@@ -10,13 +10,13 @@
 #include <vector>
 #include <limits>
 
-#include <format_reader_ptr.h>
 #include <inference_engine.hpp>
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
 
-#include <samples/common.hpp>
+#include <opencv2/core.hpp>
+#include <opencv2/imgcodecs.hpp>
+#include <opencv2/imgproc.hpp>
+
+#include <samples/ocv_common.hpp>
 #include <samples/slog.hpp>
 #include <samples/args_helper.hpp>
 #include "object_detection_demo_faster_rcnn.h"
@@ -65,9 +65,9 @@ int main(int argc, char *argv[]) {
         }
 
         /** This vector stores paths to the processed images **/
-        std::vector<std::string> images;
-        parseInputFilesArguments(images);
-        if (images.empty()) throw std::logic_error("No suitable images were found");
+        std::vector<std::string> imagePaths;
+        parseInputFilesArguments(imagePaths);
+        if (imagePaths.empty()) throw std::logic_error("No suitable images were found");
         // -----------------------------------------------------------------------------------------------------
 
         // --------------------------- 1. Load inference engine -------------------------------------
@@ -78,18 +78,6 @@ int main(int argc, char *argv[]) {
             ie.SetLogCallback(error_listener);
         }
 
-#ifdef WITH_EXTENSIONS
-        /*If CPU device, load default library with extensions that comes with the product*/
-        if (FLAGS_d.find("CPU") != std::string::npos) {
-            /**
-            * cpu_extensions library is compiled from "extension" folder containing
-            * custom MKLDNNPlugin layer implementations. These layers are not supported
-            * by mkldnn, but they can be useful for inferencing custom topologies.
-            **/
-            ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-        }
-#endif
-
         if (!FLAGS_l.empty()) {
             // CPU(MKLDNN) extensions are loaded as a shared library and passed as a pointer to base extension
             IExtensionPtr extension_ptr = make_so_pointer<IExtension>(FLAGS_l);
@@ -109,110 +97,17 @@ int main(int argc, char *argv[]) {
         // -----------------------------------------------------------------------------------------------------
 
         // --------------------------- 2. Read IR Generated by ModelOptimizer (.xml and .bin files) ------------
-        std::string binFileName = fileNameNoExt(FLAGS_m) + ".bin";
-        slog::info << "Loading network files:"
+        slog::info << "Loading network file:"
             "\n\t" << FLAGS_m <<
-            "\n\t" << binFileName <<
             slog::endl;
 
-        CNNNetReader networkReader;
         /** Read network model **/
-        networkReader.ReadNetwork(FLAGS_m);
+        CNNNetwork network = ie.ReadNetwork(FLAGS_m);
 
-        /** Extract model name and load weigts **/
-        networkReader.ReadWeights(binFileName);
-        CNNNetwork network = networkReader.getNetwork();
-
-        Precision precision = network.getPrecision();
         // -----------------------------------------------------------------------------------------------------
 
         // --------------------------- 3. Configure input & output ---------------------------------------------
 
-        // ------------------------------ Adding DetectionOutput -----------------------------------------------
-
-        /**
-         * The only meaningful difference between Faster-RCNN and SSD-like topologies is the interpretation
-         * of the output data. Faster-RCNN has 2 output layers which (the same format) are presented inside SSD.
-         *
-         * But SSD has an additional post-processing DetectionOutput layer that simplifies output filtering.
-         * So here we are adding 3 Reshapes and the DetectionOutput to the end of Faster-RCNN so it will return the
-         * same result as SSD and we can easily parse it.
-         */
-
-        std::string firstLayerName = network.getInputsInfo().begin()->first;
-
-        int inputWidth = network.getInputsInfo().begin()->second->getTensorDesc().getDims()[3];
-        int inputHeight = network.getInputsInfo().begin()->second->getTensorDesc().getDims()[2];
-
-        DataPtr bbox_pred_reshapeInPort = ((ICNNNetwork&)network).getData(FLAGS_bbox_name.c_str());
-        if (bbox_pred_reshapeInPort == nullptr) {
-            throw std::logic_error(std::string("Can't find output layer named ") + FLAGS_bbox_name);
-        }
-
-        SizeVector bbox_pred_reshapeOutDims = {
-            bbox_pred_reshapeInPort->getTensorDesc().getDims()[0] *
-            bbox_pred_reshapeInPort->getTensorDesc().getDims()[1], 1
-        };
-        DataPtr rois_reshapeInPort = ((ICNNNetwork&)network).getData(FLAGS_proposal_name.c_str());
-        if (rois_reshapeInPort == nullptr) {
-            throw std::logic_error(std::string("Can't find output layer named ") + FLAGS_proposal_name);
-        }
-
-        SizeVector rois_reshapeOutDims = {rois_reshapeInPort->getTensorDesc().getDims()[0] * rois_reshapeInPort->getTensorDesc().getDims()[1], 1};
-
-        DataPtr cls_prob_reshapeInPort = ((ICNNNetwork&)network).getData(FLAGS_prob_name.c_str());
-        if (cls_prob_reshapeInPort == nullptr) {
-            throw std::logic_error(std::string("Can't find output layer named ") + FLAGS_prob_name);
-        }
-
-        SizeVector cls_prob_reshapeOutDims = {cls_prob_reshapeInPort->getTensorDesc().getDims()[0] * cls_prob_reshapeInPort->getTensorDesc().getDims()[1], 1};
-
-        /*
-            Detection output
-        */
-
-        int normalized = 0;
-        int prior_size = normalized ? 4 : 5;
-        int num_priors = rois_reshapeOutDims[0] / prior_size;
-
-        // num_classes guessed from the output dims
-        if (bbox_pred_reshapeOutDims[0] % (num_priors * 4) != 0) {
-            throw std::logic_error("Can't guess number of classes. Something's wrong with output layers dims");
-        }
-        int num_classes = bbox_pred_reshapeOutDims[0] / (num_priors * 4);
-        slog::info << "num_classes guessed: " << num_classes << slog::endl;
-
-        LayerParams detectionOutParams;
-        detectionOutParams.name = "detection_out";
-        detectionOutParams.type = "DetectionOutput";
-        detectionOutParams.precision = precision;
-        CNNLayerPtr detectionOutLayer = CNNLayerPtr(new CNNLayer(detectionOutParams));
-        detectionOutLayer->params["background_label_id"] = "0";
-        detectionOutLayer->params["code_type"] = "caffe.PriorBoxParameter.CENTER_SIZE";
-        detectionOutLayer->params["eta"] = "1.0";
-        detectionOutLayer->params["input_height"] = std::to_string(inputHeight);
-        detectionOutLayer->params["input_width"] = std::to_string(inputWidth);
-        detectionOutLayer->params["keep_top_k"] = "200";
-        detectionOutLayer->params["nms_threshold"] = "0.3";
-        detectionOutLayer->params["normalized"] = std::to_string(normalized);
-        detectionOutLayer->params["num_classes"] = std::to_string(num_classes);
-        detectionOutLayer->params["share_location"] = "0";
-        detectionOutLayer->params["top_k"] = "400";
-        detectionOutLayer->params["variance_encoded_in_target"] = "1";
-        detectionOutLayer->params["visualize"] = "False";
-
-        detectionOutLayer->insData.push_back(bbox_pred_reshapeInPort);
-        detectionOutLayer->insData.push_back(cls_prob_reshapeInPort);
-        detectionOutLayer->insData.push_back(rois_reshapeInPort);
-
-        SizeVector detectionOutLayerOutDims = {1, 1, 200, 7};
-        DataPtr detectionOutLayerOutPort = DataPtr(new Data("detection_out", detectionOutLayerOutDims, precision,
-                                                            TensorDesc::getLayoutByDims(detectionOutLayerOutDims)));
-        detectionOutLayerOutPort->getCreatorLayer() = detectionOutLayer;
-        detectionOutLayer->outData.push_back(detectionOutLayerOutPort);
-
-        DetectionOutputPostProcessor detOutPostProcessor(detectionOutLayer.get());
-
         network.addOutput(FLAGS_bbox_name, 0);
         network.addOutput(FLAGS_prob_name, 0);
         network.addOutput(FLAGS_proposal_name, 0);
@@ -228,9 +123,6 @@ int main(int argc, char *argv[]) {
 
         std::string imageInputName, imInfoInputName;
 
-        InputInfo::Ptr inputInfo = inputsInfo.begin()->second;
-
-        SizeVector inputImageDims;
         /** Stores input image **/
 
         /** Iterating over all input blobs **/
@@ -239,7 +131,7 @@ int main(int argc, char *argv[]) {
             if (item.second->getInputData()->getTensorDesc().getDims().size() == 4) {
                 imageInputName = item.first;
 
-                slog::info << "Batch size is " << std::to_string(networkReader.getNetwork().getBatchSize()) << slog::endl;
+                slog::info << "Batch size is " << std::to_string(network.getBatchSize()) << slog::endl;
 
                 /** Creating first input blob **/
                 Precision inputPrecision = Precision::U8;
@@ -262,8 +154,8 @@ int main(int argc, char *argv[]) {
 
         OutputsDataMap outputsInfo(network.getOutputsInfo());
 
-        const int maxProposalCount = detectionOutLayerOutDims[2];
-        const int objectSize = detectionOutLayerOutDims[3];
+        const size_t maxProposalCount = 200;
+        const size_t objectSize = 7;
 
         /** Set the precision of output data provided by the user, should be called before load of the network to the device **/
 
@@ -272,6 +164,23 @@ int main(int argc, char *argv[]) {
         outputsInfo[FLAGS_proposal_name]->setPrecision(Precision::FP32);
         // -----------------------------------------------------------------------------------------------------
 
+        // ------------------------------ Adding DetectionOutput post-processor---------------------------------
+
+        /**
+         * The only meaningful difference between Faster-RCNN and SSD-like topologies is the interpretation
+         * of the output data. Faster-RCNN has 2 output layers, which are also present (in the same format) inside SSD.
+         *
+         * But SSD has an additional post-processing DetectionOutput layer that simplifies output filtering.
+         * So here we use a post-processor to convert the output of Faster-RCNN into the same format as SSD,
+         * so that we can easily parse it.
+         */
+
+        DetectionOutputPostProcessor detOutPostProcessor(
+            inputsInfo[imageInputName]->getTensorDesc().getDims(),
+            outputsInfo[FLAGS_bbox_name]->getTensorDesc().getDims(),
+            outputsInfo[FLAGS_prob_name]->getTensorDesc().getDims(),
+            outputsInfo[FLAGS_proposal_name]->getTensorDesc().getDims());
+
         // --------------------------- 4. Loading model to the device ------------------------------------------
         slog::info << "Loading model to the device" << slog::endl;
         ExecutableNetwork executable_network = ie.LoadNetwork(network, FLAGS_d);
@@ -283,56 +192,32 @@ int main(int argc, char *argv[]) {
         // -----------------------------------------------------------------------------------------------------
 
         // --------------------------- 6. Prepare input --------------------------------------------------------
-        /** Collect images data ptrs **/
-        std::vector<std::shared_ptr<unsigned char>> imagesData, originalImagesData;
-        std::vector<size_t> imageWidths, imageHeights;
-        for (auto & i : images) {
-            FormatReader::ReaderPtr reader(i.c_str());
-            if (reader.get() == nullptr) {
-                slog::warn << "Image " + i + " cannot be read!" << slog::endl;
+        /** Collect images **/
+        std::vector<cv::Mat> images;
+        for (auto &path: imagePaths) {
+            cv::Mat image = cv::imread(path, cv::IMREAD_COLOR);
+            if (image.empty()) {
+                slog::warn << "Image " + path + " cannot be read!" << slog::endl;
                 continue;
             }
-            /** Store image data **/
-            std::shared_ptr<unsigned char> originalData(reader->getData());
-            std::shared_ptr<unsigned char> data(reader->getData(inputInfo->getTensorDesc().getDims()[3], inputInfo->getTensorDesc().getDims()[2]));
-            if (data.get() != nullptr) {
-                originalImagesData.push_back(originalData);
-                imagesData.push_back(data);
-                imageWidths.push_back(reader->width());
-                imageHeights.push_back(reader->height());
-            }
+            images.push_back(image);
         }
-        if (imagesData.empty()) throw std::logic_error("Valid input images were not found!");
+        if (images.empty()) throw std::logic_error("Valid input images were not found!");
 
         size_t batchSize = network.getBatchSize();
         slog::info << "Batch size is " << std::to_string(batchSize) << slog::endl;
-        if (batchSize != imagesData.size()) {
-            slog::warn << "Number of images " + std::to_string(imagesData.size()) + \
+        if (batchSize != images.size()) {
+            slog::warn << "Number of images " + std::to_string(images.size()) +
                 " doesn't match batch size " + std::to_string(batchSize) << slog::endl;
-            batchSize = std::min(batchSize, imagesData.size());
+            batchSize = std::min(batchSize, images.size());
             slog::warn << "Number of images to be processed is "<< std::to_string(batchSize) << slog::endl;
         }
 
-        /** Creating input blob **/
+        /** Filling input tensor with images **/
         Blob::Ptr imageInput = infer_request.GetBlob(imageInputName);
 
-        /** Filling input tensor with images. First b channel, then g and r channels **/
-        size_t num_channels = imageInput->getTensorDesc().getDims()[1];
-        size_t image_size = imageInput->getTensorDesc().getDims()[3] * imageInput->getTensorDesc().getDims()[2];
-
-        unsigned char* data = static_cast<unsigned char*>(imageInput->buffer());
-
-        /** Iterate over all input images **/
-        for (size_t image_id = 0; image_id < std::min(imagesData.size(), batchSize); ++image_id) {
-            /** Iterate over all pixel in image (b,g,r) **/
-            for (size_t pid = 0; pid < image_size; pid++) {
-                /** Iterate over all channels **/
-                for (size_t ch = 0; ch < num_channels; ++ch) {
-                    /**          [images stride + channels stride + pixel id ] all in bytes            **/
-                    data[image_id * image_size * num_channels + ch * image_size + pid] = imagesData.at(image_id).get()[pid*num_channels + ch];
-                }
-            }
-        }
+        for (size_t image_id = 0; image_id < std::min(images.size(), batchSize); ++image_id)
+            matU8ToBlob<unsigned char>(images[image_id], imageInput, image_id);
 
         if (!imInfoInputName.empty()) {
             Blob::Ptr input2 = infer_request.GetBlob(imInfoInputName);
@@ -341,7 +226,7 @@ int main(int argc, char *argv[]) {
             /** Fill input tensor with values **/
             float *p = input2->buffer().as<PrecisionTrait<Precision::FP32>::value_type*>();
 
-            for (size_t image_id = 0; image_id < std::min(imagesData.size(), batchSize); ++image_id) {
+            for (size_t image_id = 0; image_id < std::min(images.size(), batchSize); ++image_id) {
                 p[image_id * imInfoDim + 0] = static_cast<float>(inputsInfo[imageInputName]->getTensorDesc().getDims()[2]);
                 p[image_id * imInfoDim + 1] = static_cast<float>(inputsInfo[imageInputName]->getTensorDesc().getDims()[3]);
                 for (size_t k = 2; k < imInfoDim; k++) {
@@ -365,7 +250,7 @@ int main(int argc, char *argv[]) {
 
         std::vector<Blob::Ptr> detOutInBlobs = { bbox_output_blob, prob_output_blob, rois_output_blob };
 
-        Blob::Ptr output_blob = std::make_shared<TBlob<float>>(TensorDesc(Precision::FP32, detectionOutLayerOutDims, Layout::NCHW));
+        Blob::Ptr output_blob = std::make_shared<TBlob<float>>(TensorDesc(Precision::FP32, {1, 1, maxProposalCount, objectSize}, Layout::NCHW));
         output_blob->allocate();
         std::vector<Blob::Ptr> detOutOutBlobs = { output_blob };
 
@@ -373,11 +258,8 @@ int main(int argc, char *argv[]) {
 
         const float* detection = static_cast<PrecisionTrait<Precision::FP32>::value_type*>(output_blob->buffer());
 
-        std::vector<std::vector<int> > boxes(batchSize);
-        std::vector<std::vector<int> > classes(batchSize);
-
         /* Each detection has image_id that denotes processed image */
-        for (int curProposal = 0; curProposal < maxProposalCount; curProposal++) {
+        for (size_t curProposal = 0; curProposal < maxProposalCount; curProposal++) {
             auto image_id = static_cast<int>(detection[curProposal * objectSize + 0]);
             if (image_id < 0) {
                 break;
@@ -385,30 +267,30 @@ int main(int argc, char *argv[]) {
 
             float confidence = detection[curProposal * objectSize + 2];
             auto label = static_cast<int>(detection[curProposal * objectSize + 1]);
-            auto xmin = static_cast<int>(detection[curProposal * objectSize + 3] * imageWidths[image_id]);
-            auto ymin = static_cast<int>(detection[curProposal * objectSize + 4] * imageHeights[image_id]);
-            auto xmax = static_cast<int>(detection[curProposal * objectSize + 5] * imageWidths[image_id]);
-            auto ymax = static_cast<int>(detection[curProposal * objectSize + 6] * imageHeights[image_id]);
+            auto xmin = static_cast<int>(detection[curProposal * objectSize + 3] * images[image_id].cols);
+            auto ymin = static_cast<int>(detection[curProposal * objectSize + 4] * images[image_id].rows);
+            auto xmax = static_cast<int>(detection[curProposal * objectSize + 5] * images[image_id].cols);
+            auto ymax = static_cast<int>(detection[curProposal * objectSize + 6] * images[image_id].rows);
 
             std::cout << "[" << curProposal << "," << label << "] element, prob = " << confidence <<
                 "    (" << xmin << "," << ymin << ")-(" << xmax << "," << ymax << ")" << " batch id : " << image_id;
 
             if (confidence > 0.5) {
                 /** Drawing only objects with >50% probability **/
-                classes[image_id].push_back(label);
-                boxes[image_id].push_back(xmin);
-                boxes[image_id].push_back(ymin);
-                boxes[image_id].push_back(xmax - xmin);
-                boxes[image_id].push_back(ymax - ymin);
                 std::cout << " WILL BE PRINTED!";
+
+                const auto &color = CITYSCAPES_COLORS[label % arraySize(CITYSCAPES_COLORS)];
+                cv::rectangle(images[image_id],
+                    cv::Point(xmin, ymin), cv::Point(xmax, ymax),
+                    cv::Scalar(color.blue(), color.green(), color.red()));
             }
             std::cout << std::endl;
         }
 
         for (size_t batch_id = 0; batch_id < batchSize; ++batch_id) {
-            addRectangles(originalImagesData[batch_id].get(), imageHeights[batch_id], imageWidths[batch_id], boxes[batch_id], classes[batch_id]);
             const std::string image_path = "out_" + std::to_string(batch_id) + ".bmp";
-            if (writeOutputBmp(image_path, originalImagesData[batch_id].get(), imageHeights[batch_id], imageWidths[batch_id])) {
+
+            if (cv::imwrite(image_path, images[batch_id])) {
                 slog::info << "Image " + image_path + " created!" << slog::endl;
             } else {
                 throw std::logic_error(std::string("Can't create a file: ") + image_path);
diff --git a/demos/object_detection_demo_faster_rcnn/object_detection_demo_faster_rcnn.h b/demos/object_detection_demo_faster_rcnn/object_detection_demo_faster_rcnn.h
index acdf2d878f7..9071f555e3c 100644
--- a/demos/object_detection_demo_faster_rcnn/object_detection_demo_faster_rcnn.h
+++ b/demos/object_detection_demo_faster_rcnn/object_detection_demo_faster_rcnn.h
@@ -14,73 +14,30 @@
 #include <limits>
 #include <chrono>
 
-#include <format_reader_ptr.h>
-#include <inference_engine.hpp>
-
-#include "samples/common.hpp"
-
-/// @brief message for help argument
 static const char help_message[] = "Print a usage message.";
-
-/// @brief message for images argument
 static const char image_message[] = "Required. Path to a .bmp image.";
-
-/// @brief message for model argument
 static const char model_message[] = "Required. Path to an .xml file with a trained model.";
-
-/// @brief message for assigning cnn calculation to device
-static const char target_device_message[] = "Optional. Specify the target device to infer on (the list of available devices is shown below). " \
-"Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for a specified device.";
-
-/// @brief message for clDNN custom kernels desc
-static const char custom_cldnn_message[] = "Required for GPU custom kernels. "\
-"Absolute path to the .xml file with the kernels descriptions.";
-
-/// @brief message for user library argument
-static const char custom_cpu_library_message[] = "Required for CPU custom layers. " \
-"Absolute path to a shared library with the kernels implementations.";
-
-/// @brief message for bbox layer name argument
+static const char target_device_message[] = "Optional. Specify the target device to infer on (the list of available devices is shown below). "
+                                            "Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                            "The demo will look for a suitable plugin for a specified device.";
+static const char custom_cldnn_message[] = "Required for GPU custom kernels. "
+                                           "Absolute path to the .xml file with the kernels descriptions.";
+static const char custom_cpu_library_message[] = "Required for CPU custom layers. "
+                                                 "Absolute path to a shared library with the kernels implementations.";
 static const char bbox_layer_name_message[] = "Optional. The name of output box prediction layer. Default value is \"bbox_pred\"";
-/// @brief message for proposal layer name argument
 static const char proposal_layer_name_message[] = "Optional. The name of output proposal layer. Default value is \"proposal\"";
-/// @brief message for prob layer name argument
 static const char prob_layer_name_message[] = "Optional. The name of output probability layer. Default value is \"cls_prob\"";
-
-/// @brief message for plugin messages
 static const char plugin_message[] = "Optional. Enables messages from a plugin";
 
-/// @brief Define flag for showing help message <br>
 DEFINE_bool(h, false, help_message);
-
-/// @brief Define parameter for set image file <br>
-/// It is a required parameter
 DEFINE_string(i, "", image_message);
-
-/// @brief Define parameter for set model file <br>
-/// It is a required parameter
 DEFINE_string(m, "", model_message);
-
-/// @brief device the target device to infer on <br>
 DEFINE_string(d, "CPU", target_device_message);
-
-/// @brief Define parameter for clDNN custom kernels path <br>
-/// Default is ./lib
 DEFINE_string(c, "", custom_cldnn_message);
-
-/// @brief Absolute path to CPU library with user layers <br>
-/// It is a optional parameter
 DEFINE_string(l, "", custom_cpu_library_message);
-
-/// @brief Custom bbox layer name
 DEFINE_string(bbox_name, "bbox_pred", bbox_layer_name_message);
-/// @brief Custom proposal layer name
 DEFINE_string(proposal_name, "proposal", proposal_layer_name_message);
-/// @brief Custom prob layer name
 DEFINE_string(prob_name, "cls_prob", prob_layer_name_message);
-
-/// @brief Enable plugin messages
 DEFINE_bool(p_msg, false, plugin_message);
 
 /**
diff --git a/demos/object_detection_demo_ssd_async/CMakeLists.txt b/demos/object_detection_demo_ssd_async/CMakeLists.txt
index 0174d9d69e8..37249579fcb 100644
--- a/demos/object_detection_demo_ssd_async/CMakeLists.txt
+++ b/demos/object_detection_demo_ssd_async/CMakeLists.txt
@@ -5,4 +5,5 @@
 ie_add_sample(NAME object_detection_demo_ssd_async
               SOURCES "${CMAKE_CURRENT_SOURCE_DIR}/main.cpp"
               HEADERS "${CMAKE_CURRENT_SOURCE_DIR}/object_detection_demo_ssd_async.hpp"
-              OPENCV_DEPENDENCIES highgui videoio imgproc)
\ No newline at end of file
+              DEPENDENCIES monitors
+              OPENCV_DEPENDENCIES highgui videoio imgproc)
diff --git a/demos/object_detection_demo_ssd_async/README.md b/demos/object_detection_demo_ssd_async/README.md
index 92101a7f633..8320972cabf 100644
--- a/demos/object_detection_demo_ssd_async/README.md
+++ b/demos/object_detection_demo_ssd_async/README.md
@@ -72,9 +72,8 @@ In a mean time your app can continue :
 
 ```cpp
 // load network
-CNNNetReader network_reader;
-network_reader.ReadNetwork("Model.xml");
-network_reader.ReadWeights("Model.bin");
+InferenceEngine::Core ie;
+auto network = ie.ReadNetwork("Model.xml");
 // populate inputs etc
 auto input = async_infer_request.GetBlob(input_name);
 ...
@@ -100,7 +99,7 @@ For more details on the requests-based Inference Engine API, including the Async
 ## Running
 
 Running the application with the `-h` option yields the following usage message:
-```sh
+```
 ./object_detection_demo_ssd_async -h
 InferenceEngine:
     API version ............ <version>
@@ -121,6 +120,7 @@ Options:
     -t                        Optional. Probability threshold for detections.
     -auto_resize              Optional. Enables resizable input with support of ROI crop & auto resize.
     -no_show                  Optional. Do not show processed video.
+    -u                        Optional. List of monitors to show initially.
 ```
 
 Running the application with the empty list of options yields the usage message given above and an error message.
diff --git a/demos/object_detection_demo_ssd_async/main.cpp b/demos/object_detection_demo_ssd_async/main.cpp
index 1200b216a56..1133f2a8db6 100644
--- a/demos/object_detection_demo_ssd_async/main.cpp
+++ b/demos/object_detection_demo_ssd_async/main.cpp
@@ -19,13 +19,11 @@
 
 #include <inference_engine.hpp>
 
+#include <monitors/presenter.h>
 #include <samples/ocv_common.hpp>
 #include <samples/slog.hpp>
 
 #include "object_detection_demo_ssd_async.hpp"
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
 
 using namespace InferenceEngine;
 
@@ -100,18 +98,6 @@ int main(int argc, char *argv[]) {
 
         /** Load extensions for the plugin **/
 
-#ifdef WITH_EXTENSIONS
-        /** Loading default extensions **/
-        if (FLAGS_d.find("CPU") != std::string::npos) {
-            /**
-             * cpu_extensions library is compiled from "extension" folder containing
-             * custom MKLDNNPlugin layer implementations. These layers are not supported
-             * by mkldnn, but they can be useful for inferring custom topologies.
-            **/
-            ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-        }
-#endif
-
         if (!FLAGS_l.empty()) {
             // CPU(MKLDNN) extensions are loaded as a shared library and passed as a pointer to base extension
             IExtensionPtr extension_ptr = make_so_pointer<IExtension>(FLAGS_l.c_str());
@@ -130,15 +116,11 @@ int main(int argc, char *argv[]) {
 
         // --------------------------- 2. Read IR Generated by ModelOptimizer (.xml and .bin files) ------------
         slog::info << "Loading network files" << slog::endl;
-        CNNNetReader netReader;
         /** Read network model **/
-        netReader.ReadNetwork(FLAGS_m);
+        auto cnnNetwork = ie.ReadNetwork(FLAGS_m);
         /** Set batch size to 1 **/
         slog::info << "Batch size is forced to  1." << slog::endl;
-        netReader.getNetwork().setBatchSize(1);
-        /** Extract model name and load it's weights **/
-        std::string binFileName = fileNameNoExt(FLAGS_m) + ".bin";
-        netReader.ReadWeights(binFileName);
+        cnnNetwork.setBatchSize(1);
         /** Read labels (if any)**/
         std::string labelFileName = fileNameNoExt(FLAGS_m) + ".labels";
         std::vector<std::string> labels;
@@ -152,7 +134,7 @@ int main(int argc, char *argv[]) {
         // --------------------------- 3. Configure input & output ---------------------------------------------
         // --------------------------- Prepare input blobs -----------------------------------------------------
         slog::info << "Checking that the inputs are as the demo expects" << slog::endl;
-        InputsDataMap inputInfo(netReader.getNetwork().getInputsInfo());
+        InputsDataMap inputInfo(cnnNetwork.getInputsInfo());
 
         std::string imageInputName, imageInfoInputName;
         size_t netInputHeight, netInputWidth;
@@ -183,13 +165,13 @@ int main(int argc, char *argv[]) {
 
         // --------------------------- Prepare output blobs -----------------------------------------------------
         slog::info << "Checking that the outputs are as the demo expects" << slog::endl;
-        OutputsDataMap outputInfo(netReader.getNetwork().getOutputsInfo());
+        OutputsDataMap outputInfo(cnnNetwork.getOutputsInfo());
         if (outputInfo.size() != 1) {
             throw std::logic_error("This demo accepts networks having only one output");
         }
         DataPtr& output = outputInfo.begin()->second;
         auto outputName = outputInfo.begin()->first;
-        const int num_classes = netReader.getNetwork().getLayerByName(outputName.c_str())->GetParamAsInt("num_classes");
+        const int num_classes = cnnNetwork.getLayerByName(outputName.c_str())->GetParamAsInt("num_classes");
         if (static_cast<int>(labels.size()) != num_classes) {
             if (static_cast<int>(labels.size()) == (num_classes - 1))  // if network assumes default "background" class, having no label
                 labels.insert(labels.begin(), "fake");
@@ -211,7 +193,7 @@ int main(int argc, char *argv[]) {
 
         // --------------------------- 4. Loading model to the device ------------------------------------------
         slog::info << "Loading model to the device" << slog::endl;
-        ExecutableNetwork network = ie.LoadNetwork(netReader.getNetwork(), FLAGS_d);
+        ExecutableNetwork network = ie.LoadNetwork(cnnNetwork, FLAGS_d);
         // -----------------------------------------------------------------------------------------------------
 
         // --------------------------- 5. Create infer request -------------------------------------------------
@@ -242,10 +224,12 @@ int main(int argc, char *argv[]) {
         typedef std::chrono::duration<double, std::ratio<1, 1000>> ms;
         auto total_t0 = std::chrono::high_resolution_clock::now();
         auto wallclock = std::chrono::high_resolution_clock::now();
-        double ocv_decode_time = 0, ocv_render_time = 0;
+        double ocv_render_time = 0;
 
         std::cout << "To close the application, press 'CTRL+C' here or switch to the output window and press ESC key" << std::endl;
         std::cout << "To switch between sync/async modes, press TAB key in the output window" << std::endl;
+        cv::Size graphSize{static_cast<int>(cap.get(cv::CAP_PROP_FRAME_WIDTH) / 4), 60};
+        Presenter presenter(FLAGS_u, static_cast<int>(cap.get(cv::CAP_PROP_FRAME_HEIGHT)) - graphSize.height - 10, graphSize);
         while (true) {
             auto t0 = std::chrono::high_resolution_clock::now();
             // Here is the first asynchronous point:
@@ -270,7 +254,7 @@ int main(int argc, char *argv[]) {
             }
 
             auto t1 = std::chrono::high_resolution_clock::now();
-            ocv_decode_time = std::chrono::duration_cast<ms>(t1 - t0).count();
+            double ocv_decode_time = std::chrono::duration_cast<ms>(t1 - t0).count();
 
             t0 = std::chrono::high_resolution_clock::now();
             // Main sync point:
@@ -296,6 +280,9 @@ int main(int argc, char *argv[]) {
                 wallclock = t0;
 
                 t0 = std::chrono::high_resolution_clock::now();
+
+                presenter.drawGraphs(curr_frame);
+
                 std::ostringstream out;
                 out << "OpenCV cap/render time: " << std::fixed << std::setprecision(2)
                     << (ocv_decode_time + ocv_render_time) << " ms";
@@ -348,6 +335,7 @@ int main(int argc, char *argv[]) {
                     }
                 }
             }
+
             if (!FLAGS_no_show) {
                 cv::imshow("Detection results", curr_frame);
             }
@@ -377,6 +365,8 @@ int main(int argc, char *argv[]) {
             if (9 == key) {  // Tab
                 isAsyncMode ^= true;
                 isModeChanged = true;
+            } else {
+                presenter.handleKey(key);
             }
         }
         // -----------------------------------------------------------------------------------------------------
@@ -388,6 +378,7 @@ int main(int argc, char *argv[]) {
         if (FLAGS_pc) {
             printPerformanceCounts(*async_infer_request_curr, std::cout, getFullDeviceName(ie, FLAGS_d));
         }
+        std::cout << presenter.reportMeans() << '\n';
     }
     catch (const std::exception& error) {
         std::cerr << "[ ERROR ] " << error.what() << std::endl;
diff --git a/demos/object_detection_demo_ssd_async/object_detection_demo_ssd_async.hpp b/demos/object_detection_demo_ssd_async/object_detection_demo_ssd_async.hpp
index f672f0d3e14..9bac75fbd6f 100644
--- a/demos/object_detection_demo_ssd_async/object_detection_demo_ssd_async.hpp
+++ b/demos/object_detection_demo_ssd_async/object_detection_demo_ssd_async.hpp
@@ -10,82 +10,35 @@
 #include <gflags/gflags.h>
 #include <iostream>
 
-/// @brief message for help argument
 static const char help_message[] = "Print a usage message.";
-
-/// @brief message for images argument
 static const char video_message[] = "Required. Path to a video file (specify \"cam\" to work with camera).";
-
-/// @brief message for model argument
 static const char model_message[] = "Required. Path to an .xml file with a trained model.";
-
-/// @brief message for assigning cnn calculation to device
-static const char target_device_message[] = "Optional. Specify the target device to infer on (the list of available devices is shown below). " \
-"Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for a specified device.";
-
-/// @brief message for performance counters
+static const char target_device_message[] = "Optional. Specify the target device to infer on (the list of available devices is shown below). "
+                                            "Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                            "The demo will look for a suitable plugin for a specified device.";
 static const char performance_counter_message[] = "Optional. Enables per-layer performance report.";
-
-/// @brief message for clDNN custom kernels desc
-static const char custom_cldnn_message[] = "Required for GPU custom kernels. "\
-"Absolute path to the .xml file with the kernel descriptions.";
-
-/// @brief message for user library argument
-static const char custom_cpu_library_message[] = "Required for CPU custom layers. " \
-"Absolute path to a shared library with the kernel implementations.";
-
-/// @brief message for probability threshold argument
+static const char custom_cldnn_message[] = "Required for GPU custom kernels. "
+                                           "Absolute path to the .xml file with the kernel descriptions.";
+static const char custom_cpu_library_message[] = "Required for CPU custom layers. "
+                                                 "Absolute path to a shared library with the kernel implementations.";
 static const char thresh_output_message[] = "Optional. Probability threshold for detections.";
-/// @brief message raw output flag
 static const char raw_output_message[] = "Optional. Inference results as raw values.";
-
-/// @brief message resizable input flag
 static const char input_resizable_message[] = "Optional. Enables resizable input with support of ROI crop & auto resize.";
-
-/// @brief Message do not show processed video
 static const char no_show_processed_video[] = "Optional. Do not show processed video.";
+static const char utilization_monitors_message[] = "Optional. List of monitors to show initially.";
 
-/// \brief Define flag for showing help message <br>
 DEFINE_bool(h, false, help_message);
-
-/// \brief Define parameter for set image file <br>
-/// It is a required parameter
 DEFINE_string(i, "", video_message);
-
-/// \brief Define parameter for set model file <br>
-/// It is a required parameter
 DEFINE_string(m, "", model_message);
-
-/// \brief device the target device to infer on <br>
 DEFINE_string(d, "CPU", target_device_message);
-
-/// \brief Enable per-layer performance report
 DEFINE_bool(pc, false, performance_counter_message);
-
-/// @brief clDNN custom kernels path <br>
-/// Default is ./lib
 DEFINE_string(c, "", custom_cldnn_message);
-
-/// @brief Absolute path to CPU library with user layers <br>
-/// It is a optional parameter
 DEFINE_string(l, "", custom_cpu_library_message);
-
-/// \brief Flag to output raw scoring results<br>
-/// It is an optional parameter
 DEFINE_bool(r, false, raw_output_message);
-
-/// \brief Flag to output raw scoring results<br>
-/// It is an optional parameter
 DEFINE_double(t, 0.5, thresh_output_message);
-
-/// \brief Enables resizable input<br>
-/// It is an optional parameter
 DEFINE_bool(auto_resize, false, input_resizable_message);
-
-/// \brief Define a flag to disable showing processed video<br>
-/// It is an optional parameter
 DEFINE_bool(no_show, false, no_show_processed_video);
+DEFINE_string(u, "", utilization_monitors_message);
 
 /**
 * \brief This function show a help message
@@ -107,4 +60,5 @@ static void showUsage() {
     std::cout << "    -t                        " << thresh_output_message << std::endl;
     std::cout << "    -auto_resize              " << input_resizable_message << std::endl;
     std::cout << "    -no_show                  " << no_show_processed_video << std::endl;
+    std::cout << "    -u                        " << utilization_monitors_message << std::endl;
 }
diff --git a/demos/object_detection_demo_yolov3_async/CMakeLists.txt b/demos/object_detection_demo_yolov3_async/CMakeLists.txt
index 3c23d4d638d..6860f2fb8e1 100644
--- a/demos/object_detection_demo_yolov3_async/CMakeLists.txt
+++ b/demos/object_detection_demo_yolov3_async/CMakeLists.txt
@@ -5,4 +5,5 @@
 ie_add_sample(NAME object_detection_demo_yolov3_async
               SOURCES "${CMAKE_CURRENT_SOURCE_DIR}/main.cpp"
               HEADERS "${CMAKE_CURRENT_SOURCE_DIR}/object_detection_demo_yolov3_async.hpp"
+              DEPENDENCIES monitors
               OPENCV_DEPENDENCIES highgui)
\ No newline at end of file
diff --git a/demos/object_detection_demo_yolov3_async/README.md b/demos/object_detection_demo_yolov3_async/README.md
index 25d237d776d..755fbf4d9dc 100644
--- a/demos/object_detection_demo_yolov3_async/README.md
+++ b/demos/object_detection_demo_yolov3_async/README.md
@@ -25,7 +25,7 @@ Engine. Upon getting a frame from the OpenCV VideoCapture, it performs inference
 ## Running
 
 Running the application with the <code>-h</code> option yields the following usage message:
-```sh
+```
 ./object_detection_demo_yolov3_async -h
 InferenceEngine:
     API version ............ <version>
@@ -47,6 +47,7 @@ Options:
     -iou_t                    Optional. Filtering intersection over union threshold for overlapping boxes.
     -auto_resize              Optional. Enable resizable input with support of ROI crop and auto resize.
     -no_show                  Optional. Do not show processed video.
+    -u                        Optional. List of monitors to show initially.
 ```
 
 Running the application with the empty list of options yields the usage message given above and an error message.
diff --git a/demos/object_detection_demo_yolov3_async/main.cpp b/demos/object_detection_demo_yolov3_async/main.cpp
index d4a185324b1..bf3d9177041 100644
--- a/demos/object_detection_demo_yolov3_async/main.cpp
+++ b/demos/object_detection_demo_yolov3_async/main.cpp
@@ -21,15 +21,12 @@
 
 #include <inference_engine.hpp>
 
+#include <monitors/presenter.h>
 #include <samples/ocv_common.hpp>
 #include <samples/slog.hpp>
 
 #include "object_detection_demo_yolov3_async.hpp"
 
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
-
 using namespace InferenceEngine;
 
 bool ParseAndCheckCommandLine(int argc, char *argv[]) {
@@ -206,17 +203,6 @@ int main(int argc, char *argv[]) {
 
         /**Loading extensions to the devices **/
 
-#ifdef WITH_EXTENSIONS
-        /** Loading default extensions **/
-        if (FLAGS_d.find("CPU") != std::string::npos) {
-            /**
-             * cpu_extensions library is compiled from the "extension" folder containing
-             * custom CPU layer implementations.
-            **/
-            ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-        }
-#endif
-
         if (!FLAGS_l.empty()) {
             // CPU extensions are loaded as a shared library and passed as a pointer to the base extension
             IExtensionPtr extension_ptr = make_so_pointer<IExtension>(FLAGS_l.c_str());
@@ -235,15 +221,11 @@ int main(int argc, char *argv[]) {
 
         // --------------- 2. Reading the IR generated by the Model Optimizer (.xml and .bin files) ------------
         slog::info << "Loading network files" << slog::endl;
-        CNNNetReader netReader;
         /** Reading network model **/
-        netReader.ReadNetwork(FLAGS_m);
+        auto cnnNetwork = ie.ReadNetwork(FLAGS_m);
         /** Setting batch size to 1 **/
         slog::info << "Batch size is forced to  1." << slog::endl;
-        netReader.getNetwork().setBatchSize(1);
-        /** Extracting the model name and loading its weights **/
-        std::string binFileName = fileNameNoExt(FLAGS_m) + ".bin";
-        netReader.ReadWeights(binFileName);
+        cnnNetwork.setBatchSize(1);
         /** Reading labels (if specified) **/
         std::string labelFileName = fileNameNoExt(FLAGS_m) + ".labels";
         std::vector<std::string> labels;
@@ -257,7 +239,7 @@ int main(int argc, char *argv[]) {
         // --------------------------- 3. Configuring input and output -----------------------------------------
         // --------------------------------- Preparing input blobs ---------------------------------------------
         slog::info << "Checking that the inputs are as the demo expects" << slog::endl;
-        InputsDataMap inputInfo(netReader.getNetwork().getInputsInfo());
+        InputsDataMap inputInfo(cnnNetwork.getInputsInfo());
         if (inputInfo.size() != 1) {
             throw std::logic_error("This demo accepts networks that have only one input");
         }
@@ -272,7 +254,7 @@ int main(int argc, char *argv[]) {
         }
         // --------------------------------- Preparing output blobs -------------------------------------------
         slog::info << "Checking that the outputs are as the demo expects" << slog::endl;
-        OutputsDataMap outputInfo(netReader.getNetwork().getOutputsInfo());
+        OutputsDataMap outputInfo(cnnNetwork.getOutputsInfo());
         for (auto &output : outputInfo) {
             output.second->setPrecision(Precision::FP32);
             output.second->setLayout(Layout::NCHW);
@@ -281,7 +263,7 @@ int main(int argc, char *argv[]) {
 
         // --------------------------- 4. Loading model to the device ------------------------------------------
         slog::info << "Loading model to the device" << slog::endl;
-        ExecutableNetwork network = ie.LoadNetwork(netReader.getNetwork(), FLAGS_d);
+        ExecutableNetwork network = ie.LoadNetwork(cnnNetwork, FLAGS_d);
 
         // -----------------------------------------------------------------------------------------------------
 
@@ -300,10 +282,12 @@ int main(int argc, char *argv[]) {
         typedef std::chrono::duration<double, std::ratio<1, 1000>> ms;
         auto total_t0 = std::chrono::high_resolution_clock::now();
         auto wallclock = std::chrono::high_resolution_clock::now();
-        double ocv_decode_time = 0, ocv_render_time = 0;
+        double ocv_render_time = 0;
 
         std::cout << "To close the application, press 'CTRL+C' here or switch to the output window and press ESC key" << std::endl;
         std::cout << "To switch between sync/async modes, press TAB key in the output window" << std::endl;
+        cv::Size graphSize{static_cast<int>(cap.get(cv::CAP_PROP_FRAME_WIDTH) / 4), 60};
+        Presenter presenter(FLAGS_u, static_cast<int>(cap.get(cv::CAP_PROP_FRAME_HEIGHT)) - graphSize.height - 10, graphSize);
         while (true) {
             auto t0 = std::chrono::high_resolution_clock::now();
             // Here is the first asynchronous point:
@@ -327,7 +311,7 @@ int main(int argc, char *argv[]) {
                 FrameToBlob(frame, async_infer_request_curr, inputName);
             }
             auto t1 = std::chrono::high_resolution_clock::now();
-            ocv_decode_time = std::chrono::duration_cast<ms>(t1 - t0).count();
+            double ocv_decode_time = std::chrono::duration_cast<ms>(t1 - t0).count();
 
             t0 = std::chrono::high_resolution_clock::now();
             // Main sync point:
@@ -353,6 +337,7 @@ int main(int argc, char *argv[]) {
                 wallclock = t0;
 
                 t0 = std::chrono::high_resolution_clock::now();
+                presenter.drawGraphs(frame);
                 std::ostringstream out;
                 out << "OpenCV cap/render time: " << std::fixed << std::setprecision(2)
                     << (ocv_decode_time + ocv_render_time) << " ms";
@@ -379,7 +364,7 @@ int main(int argc, char *argv[]) {
                 // Parsing outputs
                 for (auto &output : outputInfo) {
                     auto output_name = output.first;
-                    CNNLayerPtr layer = netReader.getNetwork().getLayerByName(output_name.c_str());
+                    CNNLayerPtr layer = cnnNetwork.getLayerByName(output_name.c_str());
                     Blob::Ptr blob = async_infer_request_curr->GetBlob(output_name);
                     ParseYOLOV3Output(layer, blob, resized_im_h, resized_im_w, height, width, FLAGS_t, objects);
                 }
@@ -446,6 +431,8 @@ int main(int argc, char *argv[]) {
             if (9 == key) {  // Tab
                 isAsyncMode ^= true;
                 isModeChanged = true;
+            } else {
+                presenter.handleKey(key);
             }
         }
         // -----------------------------------------------------------------------------------------------------
@@ -457,6 +444,8 @@ int main(int argc, char *argv[]) {
         if (FLAGS_pc) {
             printPerformanceCounts(*async_infer_request_curr, std::cout, getFullDeviceName(ie, FLAGS_d));
         }
+
+        std::cout << presenter.reportMeans() << '\n';
     }
     catch (const std::exception& error) {
         std::cerr << "[ ERROR ] " << error.what() << std::endl;
diff --git a/demos/object_detection_demo_yolov3_async/object_detection_demo_yolov3_async.hpp b/demos/object_detection_demo_yolov3_async/object_detection_demo_yolov3_async.hpp
index e14fb0d4b08..fed7710ba72 100644
--- a/demos/object_detection_demo_yolov3_async/object_detection_demo_yolov3_async.hpp
+++ b/demos/object_detection_demo_yolov3_async/object_detection_demo_yolov3_async.hpp
@@ -10,89 +10,36 @@
 #include <gflags/gflags.h>
 #include <iostream>
 
-/// @brief Message for help argument
 static const char help_message[] = "Print a usage message.";
-
-/// @brief Message for images argument
 static const char video_message[] = "Required. Path to a video file (specify \"cam\" to work with camera).";
-
-/// @brief Message for model argument
 static const char model_message[] = "Required. Path to an .xml file with a trained model.";
-
-/// @brief Message for assigning cnn calculation to device
-static const char target_device_message[] = "Optional. Specify a target device to infer on (the list of available devices is shown below). " \
-"Default value is CPU. The demo will look for a suitable plugin for the specified device";
-
-/// @brief Message for performance counters
+static const char target_device_message[] = "Optional. Specify a target device to infer on (the list of available devices is shown below). "
+                                            "Default value is CPU. The demo will look for a suitable plugin for the specified device";
 static const char performance_counter_message[] = "Optional. Enable per-layer performance report.";
-
-/// @brief Message for clDNN custom kernels desc
-static const char custom_cldnn_message[] = "Optional. Required for GPU custom kernels. "\
-"Absolute path to the .xml file with the kernels description.";
-
-/// @brief Message for user library argument
-static const char custom_cpu_library_message[] = "Optional. Required for CPU custom layers. " \
-"Absolute path to a shared library with the layers implementation.";
-
-/// @brief Message for probability threshold argument
+static const char custom_cldnn_message[] = "Optional. Required for GPU custom kernels. "
+                                           "Absolute path to the .xml file with the kernels description.";
+static const char custom_cpu_library_message[] = "Optional. Required for CPU custom layers. "
+                                                 "Absolute path to a shared library with the layers implementation.";
 static const char thresh_output_message[] = "Optional. Probability threshold for detections.";
-
-/// @brief Message for probability threshold argument
 static const char iou_thresh_output_message[] = "Optional. Filtering intersection over union threshold for overlapping boxes.";
-
-/// @brief Message raw output flag
 static const char raw_output_message[] = "Optional. Output inference results raw values showing.";
-
-/// @brief Message resizable input flag
 static const char input_resizable_message[] = "Optional. Enable resizable input with support of ROI crop and auto resize.";
-
-/// @brief Message do not show processed video
 static const char no_show_processed_video[] = "Optional. Do not show processed video.";
+static const char utilization_monitors_message[] = "Optional. List of monitors to show initially.";
 
-/// \brief Defines flag for showing help message <br>
 DEFINE_bool(h, false, help_message);
-
-/// \brief Define parameter for set video file of reading from camera <br>
-/// It is a required parameter
 DEFINE_string(i, "", video_message);
-
-/// \brief Defines parameter for setting path to a model file <br>
-/// It is a required parameter
 DEFINE_string(m, "", model_message);
-
-/// \brief Defines the target device to infer on <br>
 DEFINE_string(d, "CPU", target_device_message);
-
-/// \brief Enables per-layer performance report
 DEFINE_bool(pc, false, performance_counter_message);
-
-/// @brief Defines GPU custom kernels path <br>
-/// Default is ./lib
 DEFINE_string(c, "", custom_cldnn_message);
-
-/// @brief Defines absolute path to CPU library with user layers <br>
-/// It is a optional parameter
 DEFINE_string(l, "", custom_cpu_library_message);
-
-/// \brief Defines flag to output raw scoring results<br>
-/// It is an optional parameter
 DEFINE_bool(r, false, raw_output_message);
-
-/// \brief Defines value of confidence threshold <br>
-/// It is an optional parameter
 DEFINE_double(t, 0.5, thresh_output_message);
-
-/// \brief Defines value of intersection over union threshold<br>
-/// It is an optional parameter
 DEFINE_double(iou_t, 0.4, iou_thresh_output_message);
-
-/// \brief Enables resizable input<br>
-/// It is an optional parameter
 DEFINE_bool(auto_resize, false, input_resizable_message);
-
-/// \brief Define a flag to disable showing processed video<br>
-/// It is an optional parameter
 DEFINE_bool(no_show, false, no_show_processed_video);
+DEFINE_string(u, "", utilization_monitors_message);
 
 /**
 * \brief This function shows a help message
@@ -115,4 +62,5 @@ static void showUsage() {
     std::cout << "    -iou_t                    " << iou_thresh_output_message << std::endl;
     std::cout << "    -auto_resize              " << input_resizable_message << std::endl;
     std::cout << "    -no_show                  " << no_show_processed_video << std::endl;
+    std::cout << "    -u                        " << utilization_monitors_message << std::endl;
 }
diff --git a/demos/pedestrian_tracker_demo/CMakeLists.txt b/demos/pedestrian_tracker_demo/CMakeLists.txt
index 4d20525fc27..6b5a3dc63bd 100644
--- a/demos/pedestrian_tracker_demo/CMakeLists.txt
+++ b/demos/pedestrian_tracker_demo/CMakeLists.txt
@@ -9,4 +9,5 @@ ie_add_sample(NAME pedestrian_tracker_demo
               SOURCES ${SOURCES}
               HEADERS ${HEADERS}
               INCLUDE_DIRECTORIES "${CMAKE_CURRENT_SOURCE_DIR}/include"
+              DEPENDENCIES monitors
               OPENCV_DEPENDENCIES highgui)
diff --git a/demos/pedestrian_tracker_demo/README.md b/demos/pedestrian_tracker_demo/README.md
index ef889f6dfef..7c186ded316 100644
--- a/demos/pedestrian_tracker_demo/README.md
+++ b/demos/pedestrian_tracker_demo/README.md
@@ -27,7 +27,7 @@ After that, the application displays the tracks and the latest detections on the
 ## Running
 
 Running the application with the `-h` option yields the following usage message:
-```sh
+```
 ./pedestrian_tracker_demo -h
 InferenceEngine:
     API version ............ <version>
@@ -37,7 +37,7 @@ pedestrian_tracker_demo [OPTION]
 Options:
 
     -h                           Print a usage message.
-    -i "<path>"                  Required. Path to a video file or a folder with images (all images should have names 0000000001.jpg, 0000000002.jpg, etc).
+    -i "<path>"                  Required. Video sequence to process.
     -m_det "<path>"              Required. Path to the Pedestrian Detection Retail model (.xml) file.
     -m_reid "<path>"             Required. Path to the Pedestrian Reidentification Retail model (.xml) file.
     -l "<absolute_path>"         Optional. For CPU custom layers, if any. Absolute path to a shared library with the kernels implementation.
@@ -50,8 +50,9 @@ Options:
     -no_show                     Optional. Do not show processed video.
     -delay                       Optional. Delay between frames used for visualization. If negative, the visualization is turned off (like with the option 'no_show'). If zero, the visualization is made frame-by-frame.
     -out "<path>"                Optional. The file name to write output log file with results of pedestrian tracking. The format of the log file is compatible with MOTChallenge format.
-    -first                       Optional. The index of the first frame of video sequence to process. This has effect only if it is positive and the source video sequence is an image folder.
-    -last                        Optional. The index of the last frame of video sequence to process. This has effect only if it is positive and the source video sequence is an image folder.
+    -first                       Optional. The index of the first frame of video sequence to process. This has effect only if it is positive. The actual first frame captured depends on cv::VideoCapture implementation and may have slightly different number.
+    -last                        Optional. The index of the last frame of video sequence to process. This has effect only if it is positive.
+    -u                           Optional. List of monitors to show initially.
 ```
 
 To run the demo, you can use public or pre-trained models. To download the pre-trained models, use the OpenVINO [Model Downloader](../../tools/downloader/README.md) or go to [https://download.01.org/opencv/](https://download.01.org/opencv/).
diff --git a/demos/pedestrian_tracker_demo/include/cnn.hpp b/demos/pedestrian_tracker_demo/include/cnn.hpp
index 96d9bbf8507..aa7248808a4 100644
--- a/demos/pedestrian_tracker_demo/include/cnn.hpp
+++ b/demos/pedestrian_tracker_demo/include/cnn.hpp
@@ -18,14 +18,11 @@
  * @brief Base class of config for network
  */
 struct CnnConfig {
-    explicit CnnConfig(const std::string& path_to_model,
-                       const std::string& path_to_weights)
-        : path_to_model(path_to_model), path_to_weights(path_to_weights) {}
+    explicit CnnConfig(const std::string& path_to_model)
+        : path_to_model(path_to_model) {}
 
     /** @brief Path to model description */
     std::string path_to_model;
-    /** @brief Path to model weights */
-    std::string path_to_weights;
     /** @brief Maximal size of batch */
     int max_batch_size{1};
 };
@@ -67,7 +64,7 @@ class CnnBase {
      * @param results_fetcher Callback to fetch inference results
      */
     void Infer(const cv::Mat& frame,
-               std::function<void(const InferenceEngine::BlobMap&, size_t)> results_fetcher) const;
+               const std::function<void(const InferenceEngine::BlobMap&, size_t)>& results_fetcher) const;
 
     /**
      * @brief Run network in batch mode
@@ -76,7 +73,7 @@ class CnnBase {
      * @param results_fetcher Callback to fetch inference results
      */
     void InferBatch(const std::vector<cv::Mat>& frames,
-                    std::function<void(const InferenceEngine::BlobMap&, size_t)> results_fetcher) const;
+                    const std::function<void(const InferenceEngine::BlobMap&, size_t)>& results_fetcher) const;
 
     /** @brief Config */
     Config config_;
diff --git a/demos/pedestrian_tracker_demo/include/core.hpp b/demos/pedestrian_tracker_demo/include/core.hpp
index 8e24370deab..c5d4864a063 100644
--- a/demos/pedestrian_tracker_demo/include/core.hpp
+++ b/demos/pedestrian_tracker_demo/include/core.hpp
@@ -48,8 +48,6 @@ struct TrackedObject {
 
 using TrackedObjects = std::deque<TrackedObject>;
 
-bool operator==(const TrackedObject& first, const TrackedObject& second);
-bool operator!=(const TrackedObject& first, const TrackedObject& second);
 /// (object id, detected objects) pairs collection.
 using ObjectTracks = std::unordered_map<int, TrackedObjects>;
 
diff --git a/demos/pedestrian_tracker_demo/include/detector.hpp b/demos/pedestrian_tracker_demo/include/detector.hpp
index 9b9b690a33b..16ff5998577 100644
--- a/demos/pedestrian_tracker_demo/include/detector.hpp
+++ b/demos/pedestrian_tracker_demo/include/detector.hpp
@@ -15,9 +15,8 @@
 
 
 struct DetectorConfig : public CnnConfig {
-    explicit DetectorConfig(const std::string& path_to_model,
-                            const std::string& path_to_weights)
-        : CnnConfig(path_to_model, path_to_weights) {}
+    explicit DetectorConfig(const std::string& path_to_model)
+        : CnnConfig(path_to_model) {}
 
     float confidence_threshold{0.5f};
     float increase_scale_x{1.f};
diff --git a/demos/pedestrian_tracker_demo/include/image_reader.hpp b/demos/pedestrian_tracker_demo/include/image_reader.hpp
deleted file mode 100644
index 5780ecd5b08..00000000000
--- a/demos/pedestrian_tracker_demo/include/image_reader.hpp
+++ /dev/null
@@ -1,38 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-#pragma once
-#include <memory>
-#include <utility>
-#include <string>
-#include <opencv2/core.hpp>
-
-using ImageWithFrameIndex = std::pair<cv::Mat, int>;
-
-class ImageReader {
-public:
-    virtual bool IsOpened() const = 0;
-    virtual void SetFrameIndex(size_t frame_index) = 0;
-    virtual double GetFrameRate() const = 0;
-    virtual int FrameIndex() const = 0;
-    virtual ImageWithFrameIndex Read() = 0;
-
-    virtual ~ImageReader() {}
-
-    /// @brief Create ImageReader to read from a folder with images.
-    static std::unique_ptr<ImageReader> CreateImageReaderForImageFolder(
-        const std::string& folder_path, size_t start_frame_index = 1);
-
-    /// @brief Create ImageReader to read from a video file.
-    static std::unique_ptr<ImageReader> CreateImageReaderForVideoFile(
-        const std::string& file_path);
-
-    /// @brief Create ImageReader to read either from a video file
-    ///        (if the path points to a file) or from a folder with images
-    ///        (if the path points to a folder)
-    static std::unique_ptr<ImageReader> CreateImageReaderForPath(
-        const std::string& path);
-};
-
-
diff --git a/demos/pedestrian_tracker_demo/include/pedestrian_tracker_demo.hpp b/demos/pedestrian_tracker_demo/include/pedestrian_tracker_demo.hpp
index 5273cd08eb7..99ade5e0d60 100644
--- a/demos/pedestrian_tracker_demo/include/pedestrian_tracker_demo.hpp
+++ b/demos/pedestrian_tracker_demo/include/pedestrian_tracker_demo.hpp
@@ -9,117 +9,59 @@
 #include <vector>
 #include <gflags/gflags.h>
 
-/// @brief message for help argument
 static const char help_message[] = "Print a usage message.";
-
-/// @brief message for images argument
-static const char video_message[] = "Required. Path to a video file or a folder with images "\
-                                     "(all images should have names 0000000001.jpg, 0000000002.jpg, etc).";
-
-/// @brief message for model arguments
+static const char video_message[] = "Required. Video sequence to process.";
 static const char pedestrian_detection_model_message[] = "Required. Path to the Pedestrian Detection Retail model (.xml) file.";
 static const char pedestrian_reid_model_message[] = "Required. Path to the Pedestrian Reidentification Retail model (.xml) file.";
-
-/// @brief message for assigning Pedestrian detection inference to device
-static const char target_device_detection_message[] = "Optional. Specify the target device for pedestrian detection "\
-                                                      "(the list of available devices is shown below). Default value is CPU. " \
+static const char target_device_detection_message[] = "Optional. Specify the target device for pedestrian detection "
+                                                      "(the list of available devices is shown below). Default value is CPU. "
                                                       "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin.";
-
-/// @brief message for assigning Pedestrian Reidentification retail inference to device
-static const char target_device_reid_message[] = "Optional. Specify the target device for pedestrian reidentification "\
-                                                 "(the list of available devices is shown below). Default value is CPU. " \
+static const char target_device_reid_message[] = "Optional. Specify the target device for pedestrian reidentification "
+                                                 "(the list of available devices is shown below). Default value is CPU. "
                                                  "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin.";
-
-/// @brief message for performance counters
 static const char performance_counter_message[] = "Optional. Enable per-layer performance statistics.";
-
-/// @brief message for clDNN custom kernels desc
-static const char custom_cldnn_message[] = "Optional. For GPU custom kernels, if any. "\
+static const char custom_cldnn_message[] = "Optional. For GPU custom kernels, if any. "
                                             "Absolute path to the .xml file with the kernels description.";
-
-/// @brief message for user library argument
-static const char custom_cpu_library_message[] = "Optional. For CPU custom layers, if any. "\
+static const char custom_cpu_library_message[] = "Optional. For CPU custom layers, if any. "
                                                   "Absolute path to a shared library with the kernels implementation.";
-
-/// @brief message raw output flag
-static const char raw_output_message[] = "Optional. Output pedestrian tracking results in a raw format "\
+static const char raw_output_message[] = "Optional. Output pedestrian tracking results in a raw format "
                                           "(compatible with MOTChallenge format).";
-
-/// @brief message no show processed video
 static const char no_show_processed_video[] = "Optional. Do not show processed video.";
-
-/// @brief message for delay between frames
-static const char delay_message[] = "Optional. Delay between frames used for visualization. "\
-                                     "If negative, the visualization is turned off (like with the option 'no_show'). "\
+static const char delay_message[] = "Optional. Delay between frames used for visualization. "
+                                     "If negative, the visualization is turned off (like with the option 'no_show'). "
                                      "If zero, the visualization is made frame-by-frame.";
-
-/// @brief message for output log
-static const char output_log_message[] = "Optional. The file name to write output log file with results of pedestrian tracking. "\
+static const char output_log_message[] = "Optional. The file name to write output log file with results of pedestrian tracking. "
                                           "The format of the log file is compatible with MOTChallenge format.";
+static const char first_frame_message[] = "Optional. The index of the first frame of video sequence to process. "
+                                           "This has effect only if it is positive. The actual first frame captured "
+                                           "depends on cv::VideoCapture implementation and may have slightly different "
+                                           "number.";
+static const char last_frame_message[] = "Optional. The index of the last frame of video sequence to process. "
+                                          "This has effect only if it is positive.";
 
-/// @brief message for the first frame
-static const char first_frame_message[] = "Optional. The index of the first frame of video sequence to process. "\
-                                           "This has effect only if it is positive and the source video sequence is an image folder.";
-/// @brief message for the last frame
-static const char last_frame_message[] = "Optional. The index of the last frame of video sequence to process. "\
-                                          "This has effect only if it is positive and the source video sequence is an image folder.";
+/// @brief Message for the list of monitors to show
+static const char utilization_monitors_message[] = "Optional. List of monitors to show initially.";
 
 
-/// @brief Define flag for showing help message <br>
 DEFINE_bool(h, false, help_message);
-
-/// @brief Define parameter for set image file <br>
-/// It is a required parameter
 DEFINE_string(i, "", video_message);
-
-/// @brief Define parameter for pedestrian detection model file <br>
-/// It is a required parameter
 DEFINE_string(m_det, "", pedestrian_detection_model_message);
-
-/// @brief Define parameter for pedestrian reidentification model file <br>
-/// It is a required parameter
 DEFINE_string(m_reid, "", pedestrian_reid_model_message);
-
-/// @brief device the target device for pedestrian detection infer on <br>
 DEFINE_string(d_det, "CPU", target_device_detection_message);
-
-/// @brief device the target device for pedestrian reidentification infer on <br>
 DEFINE_string(d_reid, "CPU", target_device_reid_message);
-
-/// @brief Enable per-layer performance report
 DEFINE_bool(pc, false, performance_counter_message);
-
-/// @brief clDNN custom kernels path <br>
-/// Default is ./lib
 DEFINE_string(c, "", custom_cldnn_message);
-
-/// @brief Absolute path to CPU library with user layers <br>
-/// It is a optional parameter
 DEFINE_string(l, "", custom_cpu_library_message);
-
-/// \brief Flag to output pedestrian tracking results in raw format<br>
-/// It is an optional parameter
 DEFINE_bool(r, false, raw_output_message);
-
-/// @brief Flag to disable processed video showing<br>
-/// It is an optional parameter
 DEFINE_bool(no_show, false, no_show_processed_video);
-
-/// @brief Define delay for visualization <br>
-/// It is an optional parameter
 DEFINE_int32(delay, 3, delay_message);
-
-/// @brief Define output log path to store tracking results <br>
-/// It is an optional parameter
 DEFINE_string(out, "", output_log_message);
-
-/// @brief Define the first frame to process <br>
-/// It is an optional parameter
 DEFINE_int32(first, -1, first_frame_message);
+DEFINE_int32(last, -1, last_frame_message);
 
-/// @brief Define the last frame to process <br>
+/// \brief Define a flag to show monitors<br>
 /// It is an optional parameter
-DEFINE_int32(last, -1, last_frame_message);
+DEFINE_string(u, "", utilization_monitors_message);
 
 
 /**
@@ -146,4 +88,5 @@ static void showUsage() {
     std::cout << "    -out \"<path>\"                " << output_log_message << std::endl;
     std::cout << "    -first                       " << first_frame_message << std::endl;
     std::cout << "    -last                        " << last_frame_message << std::endl;
+    std::cout << "    -u                           " << utilization_monitors_message << std::endl;
 }
diff --git a/demos/pedestrian_tracker_demo/include/tracker.hpp b/demos/pedestrian_tracker_demo/include/tracker.hpp
index d78ca09cc6a..9a60426c30a 100644
--- a/demos/pedestrian_tracker_demo/include/tracker.hpp
+++ b/demos/pedestrian_tracker_demo/include/tracker.hpp
@@ -200,12 +200,6 @@ class PedestrianTracker {
     ///
     const TrackerParams &params() const;
 
-    ///
-    /// \brief Pipeline parameters setter.
-    /// \param[in] params Parameters of pipeline.
-    ///
-    void set_params(const TrackerParams &params);
-
     ///
     /// \brief Fast descriptor getter.
     /// \return Fast descriptor used in pipeline.
@@ -254,12 +248,6 @@ class PedestrianTracker {
     ///
     void set_distance_strong(const Distance &val);
 
-    ///
-    /// \brief Returns number of counted people.
-    /// \return a number of counted people.
-    ///
-    size_t Count() const;
-
     ///
     /// \brief Returns a detection log which is used for tracks saving.
     /// \param[in] valid_only If it is true the method returns valid track only.
@@ -286,13 +274,6 @@ class PedestrianTracker {
     ///
     cv::Mat DrawActiveTracks(const cv::Mat &frame);
 
-    ///
-    /// \brief Print confusion matrices of data association classifiers.
-    /// It works only in case of loaded detection logs instead of native
-    /// detectors.
-    ///
-    void PrintConfusionMatrices() const;
-
     ///
     /// \brief IsTrackForgotten returns true if track is forgotten.
     /// \param id Track ID.
@@ -320,13 +301,6 @@ class PedestrianTracker {
     ///
     void DropForgottenTracks();
 
-    ///
-    /// \brief DropForgottenTracks Check that the track was lost too many frames
-    /// ago
-    /// and removes it frm memory.
-    ///
-    void DropForgottenTrack(size_t track_id);
-
     ///
     /// \brief Prints reid performance counter
     ///
@@ -434,22 +408,8 @@ class PedestrianTracker {
 
     void UpdateLostTracks(const std::set<size_t> &track_ids);
 
-    static cv::Mat ConfusionMatrix(const std::vector<Match> &matches);
-
     const std::set<size_t> &active_track_ids() const;
 
-    // Returns decisions made by heuristic based on fast distance/descriptor and
-    // shape, motion and time affinity.
-    const std::vector<Match> & base_classifier_matches() const;
-
-    // Returns decisions made by heuristic based on strong distance/descriptor
-    // and
-    // shape, motion and time affinity.
-    const std::vector<Match> &reid_based_classifier_matches() const;
-
-    // Returns decisions made by strong distance/descriptor affinity.
-    const std::vector<Match> &reid_classifier_matches() const;
-
     TrackedObjects FilterDetections(const TrackedObjects &detections) const;
     bool IsTrackForgotten(const Track &track) const;
 
@@ -487,30 +447,9 @@ class PedestrianTracker {
     // Distance between current active tracks.
     std::unordered_map<std::pair<size_t, size_t>, float, pair_hash> tracks_dists_;
 
-    // Whether collect matches and compute confusion matrices for
-    // track-detection
-    // association task (base classifier, reid-based classifier,
-    // reid-classiifer).
-    bool collect_matches_;
-
-    // This vector contains decisions made by
-    // fast_apperance-motion-shape affinity model.
-    std::vector<Match> base_classifier_matches_;
-
-    // This vector contains decisions made by
-    // strong_apperance(cnn-reid)-motion-shape affinity model.
-    std::vector<Match> reid_based_classifier_matches_;
-
-    // This vector contains decisions made by
-    // strong_apperance(cnn-reid) affinity model only.
-    std::vector<Match> reid_classifier_matches_;
-
     // Number of all current tracks.
     size_t tracks_counter_;
 
-    // Number of dropped valid tracks.
-    size_t valid_tracks_counter_;
-
     cv::Size frame_size_;
 
     std::vector<cv::Scalar> colors_;
diff --git a/demos/pedestrian_tracker_demo/main.cpp b/demos/pedestrian_tracker_demo/main.cpp
index 703017f9657..69f7d3f55e5 100644
--- a/demos/pedestrian_tracker_demo/main.cpp
+++ b/demos/pedestrian_tracker_demo/main.cpp
@@ -8,9 +8,10 @@
 #include "descriptor.hpp"
 #include "distance.hpp"
 #include "detector.hpp"
-#include "image_reader.hpp"
 #include "pedestrian_tracker_demo.hpp"
 
+#include <monitors/presenter.h>
+
 #include <opencv2/core.hpp>
 
 #include <iostream>
@@ -26,7 +27,6 @@ using ImageWithFrameIndex = std::pair<cv::Mat, int>;
 
 std::unique_ptr<PedestrianTracker>
 CreatePedestrianTracker(const std::string& reid_model,
-                        const std::string& reid_weights,
                         const InferenceEngine::Core & ie,
                         const std::string & deviceName,
                         bool should_keep_tracking_info) {
@@ -49,9 +49,9 @@ CreatePedestrianTracker(const std::string& reid_model,
     tracker->set_descriptor_fast(descriptor_fast);
     tracker->set_distance_fast(distance_fast);
 
-    if (!reid_model.empty() && !reid_weights.empty()) {
-        CnnConfig reid_config(reid_model, reid_weights);
-        reid_config.max_batch_size = 16;
+    if (!reid_model.empty()) {
+        CnnConfig reid_config(reid_model);
+        reid_config.max_batch_size = 16;   // defaulting to 16
 
         std::shared_ptr<IImageDescriptor> descriptor_strong =
             std::make_shared<DescriptorIE>(reid_config, ie, deviceName);
@@ -65,8 +65,8 @@ CreatePedestrianTracker(const std::string& reid_model,
         tracker->set_descriptor_strong(descriptor_strong);
         tracker->set_distance_strong(distance_strong);
     } else {
-        std::cout << "WARNING: Either reid model or reid weights "
-            << "were not specified. "
+        std::cout << "WARNING: Reid model "
+            << "was not specified. "
             << "Only fast reidentification approach will be used." << std::endl;
     }
 
@@ -83,8 +83,6 @@ bool ParseAndCheckCommandLine(int argc, char *argv[]) {
         return false;
     }
 
-    std::cout << "Parsing input parameters" << std::endl;
-
     if (FLAGS_i.empty()) {
         throw std::logic_error("Parameter -i is not set");
     }
@@ -109,13 +107,8 @@ int main_work(int argc, char **argv) {
 
 
     // Reading command line parameters.
-    auto video_path = FLAGS_i;
-
     auto det_model = FLAGS_m_det;
-    auto det_weights = fileNameNoExt(FLAGS_m_det) + ".bin";
-
     auto reid_model = FLAGS_m_reid;
-    auto reid_weights = fileNameNoExt(FLAGS_m_reid) + ".bin";
 
     auto detlog_out = FLAGS_out;
 
@@ -134,15 +127,12 @@ int main_work(int argc, char **argv) {
         delay = -1;
     should_show = (delay >= 0);
 
-    int first_frame = FLAGS_first;
-    int last_frame = FLAGS_last;
-
     bool should_save_det_log = !detlog_out.empty();
 
-    if (first_frame >= 0)
-        std::cout << "first_frame = " << first_frame << std::endl;
-    if (last_frame >= 0)
-        std::cout << "last_frame = " << last_frame << std::endl;
+    if ((FLAGS_last >= 0) && (FLAGS_first > FLAGS_last)) {
+        throw std::runtime_error("The first frame index (" + std::to_string(FLAGS_first) + ") must not be greater than the "
+            "last frame index (" + std::to_string(FLAGS_last) + ')');
+    }
 
     std::vector<std::string> devices{detector_mode, reid_mode};
     InferenceEngine::Core ie =
@@ -150,24 +140,37 @@ int main_work(int argc, char **argv) {
             devices, custom_cpu_library, path_to_custom_layers,
             should_use_perf_counter);
 
-    DetectorConfig detector_confid(det_model, det_weights);
+    DetectorConfig detector_confid(det_model);
     ObjectDetector pedestrian_detector(detector_confid, ie, detector_mode);
 
     bool should_keep_tracking_info = should_save_det_log || should_print_out;
     std::unique_ptr<PedestrianTracker> tracker =
-        CreatePedestrianTracker(reid_model, reid_weights, ie, reid_mode,
+        CreatePedestrianTracker(reid_model, ie, reid_mode,
                                 should_keep_tracking_info);
 
-
-    // Opening video.
-    std::unique_ptr<ImageReader> video =
-        ImageReader::CreateImageReaderForPath(video_path);
-
-    PT_CHECK(video->IsOpened()) << "Failed to open video: " << video_path;
-    double video_fps = video->GetFrameRate();
-
-    if (first_frame > 0)
-        video->SetFrameIndex(first_frame);
+    cv::VideoCapture cap;
+    bool opened = false;
+    try {
+        // -i is a camera index only if the WHOLE string is a number ("0.mp4" is a file, not camera 0).
+        size_t parsed = 0;
+        const int intInput = std::stoi(FLAGS_i, &parsed);
+        opened = (parsed == FLAGS_i.size()) ? cap.open(intInput) : cap.open(FLAGS_i);
+    } catch (const std::invalid_argument&) {
+        opened = cap.open(FLAGS_i);  // not a number at all: a file path or URL
+    } catch (const std::out_of_range&) {
+        opened = cap.open(FLAGS_i);  // digits that do not fit into int: treat as a path
+    }
+    if (!opened) {
+        throw std::runtime_error("Can't open " + FLAGS_i);
+    }
+    double video_fps = cap.get(cv::CAP_PROP_FPS);
+    if (0.0 == video_fps) {
+        // the default frame rate for DukeMTMC dataset
+        video_fps = 60.0;
+    }
+    if (0 < FLAGS_first && !cap.set(cv::CAP_PROP_POS_FRAMES, FLAGS_first)) {
+        throw std::runtime_error("Can't set the frame to begin with");
+    }
 
     std::cout << "To close the application, press 'CTRL+C' here";
     if (!FLAGS_no_show) {
@@ -175,18 +178,12 @@ int main_work(int argc, char **argv) {
     }
     std::cout << std::endl;
 
-    for (;;) {
-        auto pair = video->Read();
-        cv::Mat frame = pair.first;
-        int frame_idx = pair.second;
-
-        if (frame.empty()) break;
-
-        PT_CHECK(frame_idx >= first_frame);
+    cv::Size graphSize{static_cast<int>(cap.get(cv::CAP_PROP_FRAME_WIDTH) / 4), 60};
+    Presenter presenter(FLAGS_u, 10, graphSize);
 
-        if ( (last_frame >= 0) && (frame_idx > last_frame) ) {
-            std::cout << "Frame " << frame_idx << " is greater than last_frame = "
-                << last_frame << " -- break";
+    for (int32_t frame_idx = std::max(0, FLAGS_first); 0 > FLAGS_last || frame_idx <= FLAGS_last; ++frame_idx) {
+        cv::Mat frame;
+        if (!cap.read(frame)) {
             break;
         }
 
@@ -199,6 +196,8 @@ int main_work(int argc, char **argv) {
         uint64_t cur_timestamp = static_cast<uint64_t >(1000.0 / video_fps * frame_idx);
         tracker->Process(frame, detections, cur_timestamp);
 
+        presenter.drawGraphs(frame);
+
         if (should_show) {
             // Drawing colored "worms" (tracks).
             frame = tracker->DrawActiveTracks(frame);
@@ -223,6 +222,7 @@ int main_work(int argc, char **argv) {
             char k = cv::waitKey(delay);
             if (k == 27)
                 break;
+            presenter.handleKey(k);
         }
 
         if (should_save_det_log && (frame_idx % 100 == 0)) {
@@ -243,6 +243,8 @@ int main_work(int argc, char **argv) {
         pedestrian_detector.PrintPerformanceCounts(getFullDeviceName(ie, FLAGS_d_det));
         tracker->PrintReidPerformanceCounts(getFullDeviceName(ie, FLAGS_d_reid));
     }
+
+    std::cout << presenter.reportMeans() << '\n';
     return 0;
 }
 
diff --git a/demos/pedestrian_tracker_demo/src/cnn.cpp b/demos/pedestrian_tracker_demo/src/cnn.cpp
index 5056c0531e5..995f3bf4550 100644
--- a/demos/pedestrian_tracker_demo/src/cnn.cpp
+++ b/demos/pedestrian_tracker_demo/src/cnn.cpp
@@ -23,20 +23,14 @@ CnnBase::CnnBase(const Config& config,
     config_(config), ie_(ie), deviceName_(deviceName) {}
 
 void CnnBase::Load() {
-    CNNNetReader net_reader;
-    net_reader.ReadNetwork(config_.path_to_model);
-    net_reader.ReadWeights(config_.path_to_weights);
+    auto cnnNetwork = ie_.ReadNetwork(config_.path_to_model);
 
-    if (!net_reader.isParseSuccess()) {
-        THROW_IE_EXCEPTION << "Cannot load model";
-    }
-
-    const int currentBatchSize = net_reader.getNetwork().getBatchSize();
+    const int currentBatchSize = cnnNetwork.getBatchSize();
     if (currentBatchSize != config_.max_batch_size)
-        net_reader.getNetwork().setBatchSize(config_.max_batch_size);
+        cnnNetwork.setBatchSize(config_.max_batch_size);
 
     InferenceEngine::InputsDataMap in;
-    in = net_reader.getNetwork().getInputsInfo();
+    in = cnnNetwork.getInputsInfo();
     if (in.size() != 1) {
         THROW_IE_EXCEPTION << "Network should have only one input";
     }
@@ -47,7 +41,7 @@ void CnnBase::Load() {
     input_blob_->allocate();
     BlobMap inputs;
     inputs[in.begin()->first] = input_blob_;
-    outInfo_ = net_reader.getNetwork().getOutputsInfo();
+    outInfo_ = cnnNetwork.getOutputsInfo();
 
     for (auto&& item : outInfo_) {
         SizeVector outputDims = item.second->getTensorDesc().getDims();
@@ -59,7 +53,7 @@ void CnnBase::Load() {
         outputs_[item.first] = output;
     }
 
-    executable_network_ = ie_.LoadNetwork(net_reader.getNetwork(), deviceName_);
+    executable_network_ = ie_.LoadNetwork(cnnNetwork, deviceName_);
     infer_request_ = executable_network_.CreateInferRequest();
     infer_request_.SetInput(inputs);
     infer_request_.SetOutput(outputs_);
@@ -67,7 +61,7 @@ void CnnBase::Load() {
 
 void CnnBase::InferBatch(
     const std::vector<cv::Mat>& frames,
-    std::function<void(const InferenceEngine::BlobMap&, size_t)> fetch_results) const {
+    const std::function<void(const InferenceEngine::BlobMap&, size_t)>& fetch_results) const {
     const size_t batch_size = input_blob_->getTensorDesc().getDims()[0];
 
     size_t num_imgs = frames.size();
@@ -77,7 +71,6 @@ void CnnBase::InferBatch(
             matU8ToBlob<uint8_t>(frames[batch_i + b], input_blob_, b);
         }
 
-        infer_request_.SetBatch(current_batch_size);
         infer_request_.Infer();
 
         fetch_results(outputs_, current_batch_size);
@@ -90,7 +83,7 @@ void CnnBase::PrintPerformanceCounts(std::string fullDeviceName) const {
 }
 
 void CnnBase::Infer(const cv::Mat& frame,
-                    std::function<void(const InferenceEngine::BlobMap&, size_t)> fetch_results) const {
+                    const std::function<void(const InferenceEngine::BlobMap&, size_t)>& fetch_results) const {
     InferBatch({frame}, fetch_results);
 }
 
diff --git a/demos/pedestrian_tracker_demo/src/core.cpp b/demos/pedestrian_tracker_demo/src/core.cpp
deleted file mode 100644
index d135f8a7d64..00000000000
--- a/demos/pedestrian_tracker_demo/src/core.cpp
+++ /dev/null
@@ -1,19 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-#include "core.hpp"
-
-#include <iostream>
-
-bool operator==(const TrackedObject& first, const TrackedObject& second) {
-    return ( (first.rect == second.rect)
-            && (first.confidence == second.confidence)
-            && (first.frame_idx == second.frame_idx)
-            && (first.object_id == second.object_id)
-            && (first.timestamp == second.timestamp) );
-}
-
-bool operator!=(const TrackedObject& first, const TrackedObject& second) {
-    return !(first == second);
-}
diff --git a/demos/pedestrian_tracker_demo/src/detector.cpp b/demos/pedestrian_tracker_demo/src/detector.cpp
index 5e8584602d9..97accfa9fa6 100644
--- a/demos/pedestrian_tracker_demo/src/detector.cpp
+++ b/demos/pedestrian_tracker_demo/src/detector.cpp
@@ -98,14 +98,9 @@ ObjectDetector::ObjectDetector(
     config_(config),
     ie_(ie),
     deviceName_(deviceName) {
-    CNNNetReader net_reader;
-    net_reader.ReadNetwork(config.path_to_model);
-    net_reader.ReadWeights(config.path_to_weights);
-    if (!net_reader.isParseSuccess()) {
-        THROW_IE_EXCEPTION << "Cannot load model";
-    }
+    auto cnnNetwork = ie_.ReadNetwork(config.path_to_model);
 
-    InputsDataMap inputInfo(net_reader.getNetwork().getInputsInfo());
+    InputsDataMap inputInfo(cnnNetwork.getInputsInfo());
     if (1 == inputInfo.size() || 2 == inputInfo.size()) {
         for (const std::pair<std::string, InputInfo::Ptr>& input : inputInfo) {
             InputInfo::Ptr inputInfo = input.second;
@@ -130,14 +125,14 @@ ObjectDetector::ObjectDetector(
     inputInfoFirst->setPrecision(Precision::U8);
     inputInfoFirst->getInputData()->setLayout(Layout::NCHW);
 
-    OutputsDataMap outputInfo(net_reader.getNetwork().getOutputsInfo());
+    OutputsDataMap outputInfo(cnnNetwork.getOutputsInfo());
     if (outputInfo.size() != 1) {
         THROW_IE_EXCEPTION << "Person Detection network should have only one output";
     }
     DataPtr& _output = outputInfo.begin()->second;
     output_name_ = outputInfo.begin()->first;
 
-    const CNNLayerPtr outputLayer = net_reader.getNetwork().getLayerByName(output_name_.c_str());
+    const CNNLayerPtr outputLayer = cnnNetwork.getLayerByName(output_name_.c_str());
     if (outputLayer->type != "DetectionOutput") {
         THROW_IE_EXCEPTION << "Person Detection network output layer(" + outputLayer->name +
             ") should be DetectionOutput, but was " +  outputLayer->type;
@@ -161,7 +156,7 @@ ObjectDetector::ObjectDetector(
     _output->setPrecision(Precision::FP32);
     _output->setLayout(TensorDesc::getLayoutByDims(_output->getDims()));
 
-    net_ = ie_.LoadNetwork(net_reader.getNetwork(), deviceName_);
+    net_ = ie_.LoadNetwork(cnnNetwork, deviceName_);
 }
 
 void ObjectDetector::wait() {
diff --git a/demos/pedestrian_tracker_demo/src/image_reader.cpp b/demos/pedestrian_tracker_demo/src/image_reader.cpp
deleted file mode 100644
index ca2e61cd19d..00000000000
--- a/demos/pedestrian_tracker_demo/src/image_reader.cpp
+++ /dev/null
@@ -1,145 +0,0 @@
-// Copyright (C) 2018-2019 Intel Corporation
-// SPDX-License-Identifier: Apache-2.0
-//
-
-#include "image_reader.hpp"
-#include <details/ie_exception.hpp>
-#include <iomanip>
-#include <string>
-#include <memory>
-#include <sstream>
-#include <sys/types.h>
-#include <sys/stat.h>
-#include <opencv2/highgui.hpp>
-#include <opencv2/videoio.hpp>
-
-namespace {
-bool IsFolder(const std::string& folder_path) {
-    struct stat folder_info;
-    if ( stat( folder_path.c_str(), &folder_info ) != 0 )
-        return false;
-    if ( folder_info.st_mode & S_IFDIR )
-        return true;
-    return false;
-}
-bool IsFile(const std::string& path) {
-    struct stat info;
-    if ( stat( path.c_str(), &info ) != 0 )
-        return false;
-    if ( info.st_mode & S_IFREG )
-        return true;
-    return false;
-}
-}  // anonymous namespace
-
-class ImageReaderForFolder: public ImageReader {
-public:
-    ImageReaderForFolder(const std::string& folder_path, size_t start_frame_index) {
-        folder_path_ = folder_path;
-        frame_index_ = start_frame_index;
-    }
-
-    bool IsOpened() const {
-        return IsFolder(folder_path_);
-    }
-    void SetFrameIndex(size_t frame_index) {
-        frame_index_ = frame_index;
-    }
-
-    int FrameIndex() const {
-        return frame_index_;
-    }
-
-    ImageWithFrameIndex Read() {
-        auto path = GetImagePath(folder_path_, frame_index_);
-        cv::Mat img = cv::imread(path);
-
-        ImageWithFrameIndex result;
-        result.first = img;
-        result.second = frame_index_;
-
-        frame_index_++;
-        return result;
-    }
-
-    // Note that for images folder
-    // the default frame rate for DukeMTMC dataset is returned
-    double GetFrameRate() const {return 60.0;}
-
-private:
-    std::string folder_path_;
-    size_t frame_index_ = 1;
-
-    static std::string GetImagePath(const std::string& folder_path,
-                                    size_t frame_index) {
-        std::stringstream strstr;
-        strstr << folder_path << "/"
-            << std::internal
-            << std::setfill('0')
-            << std::setw(10)
-            << frame_index
-            << ".jpg";
-        return strstr.str();
-    }
-};
-
-class ImageReaderForVideoFile: public ImageReader {
-public:
-    explicit ImageReaderForVideoFile(const std::string& file_path)
-        : video_capture(file_path) {}
-
-    bool IsOpened() const {
-        return video_capture.isOpened();
-    }
-    void SetFrameIndex(size_t frame_index) {
-        THROW_IE_EXCEPTION << "ImageReader does not set frame index in video, "
-            << "since in the current implementation it is not precise";
-    }
-
-    int FrameIndex() const {
-        return frame_index_;
-    }
-
-    ImageWithFrameIndex Read() {
-        ImageWithFrameIndex result;
-        video_capture >> result.first;
-        result.second = frame_index_;
-        frame_index_++;
-        return result;
-    }
-
-    double GetFrameRate() const {
-        double video_fps = video_capture.get(cv::CAP_PROP_FPS);
-        if ((video_fps <= 0) || (video_fps > 200)) {
-            video_fps = 30;
-        }
-        return video_fps;
-    }
-
-private:
-    size_t frame_index_ = 1;
-    cv::VideoCapture video_capture;
-};
-
-std::unique_ptr<ImageReader> ImageReader::CreateImageReaderForImageFolder(
-    const std::string& folder_path, size_t start_frame_index) {
-    return std::unique_ptr<ImageReader>(
-        new ImageReaderForFolder(folder_path, start_frame_index));
-}
-
-std::unique_ptr<ImageReader> ImageReader::CreateImageReaderForVideoFile(
-    const std::string& file_path) {
-    return std::unique_ptr<ImageReader>(
-        new ImageReaderForVideoFile(file_path));
-}
-
-std::unique_ptr<ImageReader> ImageReader::CreateImageReaderForPath(
-    const std::string& path) {
-    if (IsFolder(path))
-        return ImageReader::CreateImageReaderForImageFolder(path);
-
-    if (IsFile(path))
-        return ImageReader::CreateImageReaderForVideoFile(path);
-
-    return std::unique_ptr<ImageReader>();
-}
diff --git a/demos/pedestrian_tracker_demo/src/tracker.cpp b/demos/pedestrian_tracker_demo/src/tracker.cpp
index b40ff3b0c0e..5eb235eabbb 100644
--- a/demos/pedestrian_tracker_demo/src/tracker.cpp
+++ b/demos/pedestrian_tracker_demo/src/tracker.cpp
@@ -141,26 +141,11 @@ void ValidateParams(const TrackerParams &p) {
     }
 }
 
-// Returns confusion matrix as:
-//   |tp fn|
-//   |fp tn|
-cv::Mat PedestrianTracker::ConfusionMatrix(const std::vector<Match> &matches) {
-    const bool kNegative = false;
-    cv::Mat conf_mat(2, 2, CV_32F, cv::Scalar(0));
-    for (const auto &m : matches) {
-        conf_mat.at<float>(m.gt_label == kNegative, m.pr_label == kNegative)++;
-    }
-
-    return conf_mat;
-}
-
 PedestrianTracker::PedestrianTracker(const TrackerParams &params)
     : params_(params),
     descriptor_strong_(nullptr),
     distance_strong_(nullptr),
-    collect_matches_(true),
     tracks_counter_(0),
-    valid_tracks_counter_(0),
     frame_size_(0, 0),
     prev_timestamp_(std::numeric_limits<uint64_t>::max()) {
         ValidateParams(params);
@@ -169,12 +154,6 @@ PedestrianTracker::PedestrianTracker(const TrackerParams &params)
 // Pipeline parameters getter.
 const TrackerParams &PedestrianTracker::params() const { return params_; }
 
-// Pipeline parameters setter.
-void PedestrianTracker::set_params(const TrackerParams &params) {
-    ValidateParams(params);
-    params_ = params;
-}
-
 // Descriptor fast getter.
 const PedestrianTracker::Descriptor &PedestrianTracker::descriptor_fast() const {
     return descriptor_fast_;
@@ -224,25 +203,6 @@ DetectionLog PedestrianTracker::GetDetectionLog(const bool valid_only) const {
     return ConvertTracksToDetectionLog(all_tracks(valid_only));
 }
 
-// Returns decisions made by heuristic based on fast distance/descriptor and
-// shape, motion and time affinity.
-const std::vector<PedestrianTracker::Match> &
-PedestrianTracker::base_classifier_matches() const {
-    return base_classifier_matches_;
-}
-
-// Returns decisions made by heuristic based on strong distance/descriptor
-// and
-// shape, motion and time affinity.
-const std::vector<PedestrianTracker::Match> &PedestrianTracker::reid_based_classifier_matches() const {
-    return reid_based_classifier_matches_;
-}
-
-// Returns decisions made by strong distance/descriptor affinity.
-const std::vector<PedestrianTracker::Match> &PedestrianTracker::reid_classifier_matches() const {
-    return reid_classifier_matches_;
-}
-
 TrackedObjects PedestrianTracker::FilterDetections(
     const TrackedObjects &detections) const {
     TrackedObjects filtered_detections;
@@ -458,13 +418,6 @@ void PedestrianTracker::Process(const cv::Mat &frame,
             auto last_det = tracks_.at(track_id).objects.back();
             last_det.rect = tracks_.at(track_id).predicted_rect;
 
-            if (collect_matches_ && last_det.object_id >= 0 &&
-                detections[det_id].object_id >= 0) {
-                base_classifier_matches_.emplace_back(
-                    tracks_.at(track_id).objects.back(), last_det.rect,
-                    detections[det_id], conf > params_.aff_thr_fast);
-            }
-
             if (conf > params_.aff_thr_fast) {
                 AppendToTrack(frame, track_id, detections[det_id],
                               descriptors_fast[det_id], cv::Mat());
@@ -527,11 +480,6 @@ void PedestrianTracker::DropForgottenTracks() {
             new_tracks.emplace(reassign_id ? counter : pair.first, pair.second);
             new_active_tracks.emplace(reassign_id ? counter : pair.first);
             counter++;
-
-        } else {
-            if (IsTrackValid(pair.first)) {
-                valid_tracks_counter_++;
-            }
         }
     }
     tracks_.swap(new_tracks);
@@ -540,12 +488,6 @@ void PedestrianTracker::DropForgottenTracks() {
     tracks_counter_ = reassign_id ? counter : tracks_counter_;
 }
 
-void PedestrianTracker::DropForgottenTrack(size_t track_id) {
-    PT_CHECK(IsTrackForgotten(track_id));
-    PT_CHECK(active_track_ids_.count(track_id) == 0);
-    tracks_.erase(track_id);
-}
-
 float PedestrianTracker::ShapeAffinity(float weight, const cv::Rect &trk,
                                        const cv::Rect &det) {
     float w_dist = static_cast<float>(std::abs(trk.width - det.width) / (trk.width + det.width));
@@ -691,17 +633,6 @@ PedestrianTracker::StrongMatching(
 
         float affinity = static_cast<float>(reid_affinity) * Affinity(last_det, detection);
 
-        if (collect_matches_ && last_det.object_id >= 0 &&
-            detection.object_id >= 0) {
-            reid_classifier_matches_.emplace_back(track.objects.back(), last_det.rect,
-                                                  detection,
-                                                  reid_affinity > params_.reid_thr);
-
-            reid_based_classifier_matches_.emplace_back(
-                track.objects.back(), last_det.rect, detection,
-                affinity > params_.aff_thr_strong);
-        }
-
         bool is_detection_matching =
             reid_affinity > params_.reid_thr && affinity > params_.aff_thr_strong;
 
@@ -835,14 +766,6 @@ bool PedestrianTracker::IsTrackForgotten(const Track &track) const {
     return (track.lost > params_.forget_delay);
 }
 
-size_t PedestrianTracker::Count() const {
-    size_t count = valid_tracks_counter_;
-    for (const auto &pair : tracks_) {
-        count += (IsTrackValid(pair.first) ? 1 : 0);
-    }
-    return count;
-}
-
 std::unordered_map<size_t, std::vector<cv::Point>>
 PedestrianTracker::GetActiveTracks() const {
     std::unordered_map<size_t, std::vector<cv::Point>> active_tracks;
@@ -893,41 +816,6 @@ cv::Mat PedestrianTracker::DrawActiveTracks(const cv::Mat &frame) {
     return out_frame;
 }
 
-const cv::Size kMinFrameSize = cv::Size(320, 240);
-const cv::Size kMaxFrameSize = cv::Size(1920, 1080);
-
-void PedestrianTracker::PrintConfusionMatrices() const {
-    std::cout << "Base classifier quality: " << std::endl;
-    {
-        auto cm = ConfusionMatrix(base_classifier_matches());
-        std::cout << cm << std::endl;
-        std::cout << "or" << std::endl;
-        cm.row(0) = cm.row(0) / std::max(1.0, cv::sum(cm.row(0))[0]);
-        cm.row(1) = cm.row(1) / std::max(1.0, cv::sum(cm.row(1))[0]);
-        std::cout << cm << std::endl << std::endl;
-    }
-
-    std::cout << "Reid-based classifier quality: " << std::endl;
-    {
-        auto cm = ConfusionMatrix(reid_based_classifier_matches());
-        std::cout << cm << std::endl;
-        std::cout << "or" << std::endl;
-        cm.row(0) = cm.row(0) / std::max(1.0, cv::sum(cm.row(0))[0]);
-        cm.row(1) = cm.row(1) / std::max(1.0, cv::sum(cm.row(1))[0]);
-        std::cout << cm << std::endl << std::endl;
-    }
-
-    std::cout << "Reid only classifier quality: " << std::endl;
-    {
-        auto cm = ConfusionMatrix(reid_classifier_matches());
-        std::cout << cm << std::endl;
-        std::cout << "or" << std::endl;
-        cm.row(0) = cm.row(0) / std::max(1.0, cv::sum(cm.row(0))[0]);
-        cm.row(1) = cm.row(1) / std::max(1.0, cv::sum(cm.row(1))[0]);
-        std::cout << cm << std::endl << std::endl;
-    }
-}
-
 void PedestrianTracker::PrintReidPerformanceCounts(std::string fullDeviceName) const {
     if (descriptor_strong_) {
         descriptor_strong_->PrintPerformanceCounts(fullDeviceName);
diff --git a/demos/pedestrian_tracker_demo/src/utils.cpp b/demos/pedestrian_tracker_demo/src/utils.cpp
index 0b8fda2cb72..ab281de99ec 100644
--- a/demos/pedestrian_tracker_demo/src/utils.cpp
+++ b/demos/pedestrian_tracker_demo/src/utils.cpp
@@ -14,9 +14,6 @@
 #include <string>
 #include <set>
 #include <memory>
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
 
 using namespace InferenceEngine;
 
@@ -85,9 +82,6 @@ LoadInferenceEngine(const std::vector<std::string>& devices,
 
         /** Load extensions for the CPU device **/
         if ((device.find("CPU") != std::string::npos)) {
-#ifdef WITH_EXTENSIONS
-            ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-#endif
             if (!custom_cpu_library.empty()) {
                 // CPU(MKLDNN) extensions are loaded as a shared library and passed as a pointer to base extension
                 auto extension_ptr = make_so_pointer<IExtension>(custom_cpu_library);
@@ -98,12 +92,6 @@ LoadInferenceEngine(const std::vector<std::string>& devices,
             ie.SetConfig({{PluginConfigParams::KEY_CONFIG_FILE, custom_cldnn_kernels}}, "GPU");
         }
 
-        if (device.find("CPU") != std::string::npos) {
-            ie.SetConfig({{PluginConfigParams::KEY_DYN_BATCH_ENABLED, PluginConfigParams::YES}}, "CPU");
-        } else if (device.find("GPU") != std::string::npos) {
-            ie.SetConfig({{PluginConfigParams::KEY_DYN_BATCH_ENABLED, PluginConfigParams::YES}}, "GPU");
-        }
-
         if (should_use_perf_counter)
             ie.SetConfig({{PluginConfigParams::KEY_PERF_COUNT, PluginConfigParams::YES}});
 
diff --git a/demos/python_demos/3d_segmentation_demo/3d_segmentation_demo.py b/demos/python_demos/3d_segmentation_demo/3d_segmentation_demo.py
index e0bb1a185be..34cda6307ac 100755
--- a/demos/python_demos/3d_segmentation_demo/3d_segmentation_demo.py
+++ b/demos/python_demos/3d_segmentation_demo/3d_segmentation_demo.py
@@ -67,12 +67,29 @@
 # file suffixes to form a data tensor
 DATA_SUFFIXES = [SUFFIX_T1, SUFFIX_T2, SUFFIX_FLAIR, SUFFIX_T1CE]
 
+NIFTI_FOLDER = 0
+NIFTI_FILE = 1
+TIFF_FILE = 2
+
+
+def mri_sequence(arg):
+    sequence = tuple(int(k) for k in arg.split(','))
+    if len(sequence) != 4:
+        raise AttributeError("The MRI-sequence should contain exactly 4 values, but contains {}.".format(len(sequence)))
+    if len(set(sequence)) != 4:
+        raise AttributeError("The MRI-sequence has repeating scan types - {}. "
+                             "The MRI-sequence must contain native T1, native T2, T2-FLAIR, "
+                             "post-Gadolinium contrast T1 scans in the specific for the net order".
+                             format(sequence))
+    return sequence
+
+
 def parse_arguments():
     parser = ArgumentParser(add_help=False)
     args = parser.add_argument_group('Options')
     args.add_argument('-h', '--help', action='help', default=SUPPRESS, help='Show this help message and exit.')
     args.add_argument('-i', '--path_to_input_data', type=str, required=True,
-                        help="Required. Path to an input folder with NIfTI data/TIFF file")
+                        help="Required. Path to an input folder with NIfTI data/NIFTI file/TIFF file")
     args.add_argument('-m', '--path_to_model', type=str, required=True,
                         help="Required. Path to an .xml file with a trained model")
     args.add_argument('-o', '--path_to_output', type=str, required=True,
@@ -92,9 +109,25 @@ def parse_arguments():
     args.add_argument('-c', '--path_to_cldnn_config', type=str, required=False,
                         help="Required for GPU custom kernels. "
                              "Absolute path to an .xml file with the kernels description.")
+    args.add_argument('-ms', '--mri_sequence', type=mri_sequence, metavar='N1,N2,N3,N4', default=(0,1,2,3),
+                      help='Optional. Transfer MRI-sequence from dataset order to the network order.')
+    args.add_argument("--full_intensities_range", required=False, default=False, action="store_true",
+                      help="Take intensities of the input image in a full range.")
     return parser.parse_args()
 
 
+def get_input_type(path):
+    if os.path.isdir(path):
+        return NIFTI_FOLDER
+    elif fnmatch(path, '*.nii.gz') or fnmatch(path, '*.nii'):
+        return NIFTI_FILE
+    elif fnmatch(path, '*.tif') or fnmatch(path, '*.tiff'):
+        return TIFF_FILE
+
+    raise RuntimeError("Input must be a folder with 4 NIFTI files, single NIFTI file (*.nii or *.nii.gz) or "
+                         "TIFF file (*.tif or *.tiff)")
+
+
 def find_series_name(path):
     for file in os.listdir(path):
         if fnmatch(file, '*.nii.gz'):
@@ -125,25 +158,24 @@ def bbox3(img):
     return np.array([[-1, -1, -1], [0, 0, 0]])
 
 
-def read_nii_header(data_path, series_name, suffix, separate_folder=True):
-    filename = os.path.join(data_path, series_name, series_name + suffix)
-    if not separate_folder:
-        filename = os.path.join(data_path, series_name + suffix)
+def read_nii_header(data_path, name):
+    filename = os.path.join(data_path, name)
     if not os.path.exists(filename):
-        raise AttributeError("File {} is not exist. Please, validate path to input".format(filename))
+        raise ValueError("File {} is not exist. Please, validate path to input".format(filename))
     return nib.load(filename)
 
 
-def normalize(image, mask):
+def normalize(image, mask, full_intensities_range):
     ret = image.copy()
     image_masked = np.ma.masked_array(ret, ~(mask))
-    ret[mask] = ret[mask] - np.mean(image_masked)
-    ret[mask] = ret[mask] / np.var(image_masked) ** 0.5
-    ret[ret > 5.] = 5.
-    ret[ret < -5.] = -5.
-    ret += 5.
-    ret /= 10
-    ret[~mask] = 0.
+    ret = ret - np.mean(image_masked)
+    ret = ret / np.var(image_masked) ** 0.5
+    if not full_intensities_range:
+        ret[ret > 5.] = 5.
+        ret[ret < -5.] = -5.
+        ret += 5.
+        ret /= 10
+        ret[~mask] = 0.
     return ret
 
 
@@ -153,21 +185,39 @@ def resample_np(data, output_shape, order):
     return interpolation.zoom(data, zoom=factor, order=order)
 
 
-def read_image(test_data_path, series_name, sizes=(128, 128, 128)):
+def read_image(test_data_path, data_name, sizes=(128, 128, 128), is_series=True, \
+               mri_sequence_order=(0,1,2,3), full_intensities_range=False):
     images_list = []
-    handle = None
+    original_shape = ()
     bboxes = np.zeros(shape=(len(DATA_SUFFIXES),) + (2, 3))
 
-    for j, s in enumerate(DATA_SUFFIXES):
-        image_handle = read_nii_header(test_data_path, series_name, s, separate_folder=False)
-        handle = image_handle
-        image = image_handle.get_data().astype(np.float32)
+    if is_series:
+        data_seq = [DATA_SUFFIXES[i] for i in mri_sequence_order]
+        for j, s in enumerate(data_seq):
+            image_handle = read_nii_header(test_data_path, data_name + s)
+            affine = image_handle.affine
+            image = image_handle.get_data().astype(np.float32)
 
-        mask = image > 0.
-        bboxes[j] = bbox3(mask)
-        image = normalize(image, mask)
+            mask = image > 0.
+            bboxes[j] = bbox3(mask)
+            image = normalize(image, mask, full_intensities_range)
 
-        images_list.append(image.reshape((1, 1,) + image.shape))
+            images_list.append(image.reshape((1, 1,) + image.shape))
+            original_shape = image.shape
+    else:
+        data_handle = read_nii_header(test_data_path, data_name)
+        affine = data_handle.affine
+        data = data_handle.get_data().astype(np.float32)
+        assert len(data.shape) == 4, 'Wrong data dimensions - {}, must be 4'.format(len(data.shape))
+        assert data.shape[3] == 4, 'Wrong data shape - {}, must be (:,:,:,4)'.format(data.shape)
+        # Reading order is specified for data from http://medicaldecathlon.com/
+        for j in mri_sequence_order:
+            image = data[:, :, :, j]
+            mask = image > 0
+            bboxes[j] = bbox3(mask)
+            image = normalize(image, mask, full_intensities_range)
+            images_list.append(image.reshape((1, 1,) + image.shape))
+        original_shape = data.shape[:3]
 
     bbox_min = np.min(bboxes[:, 0, :], axis=0).ravel().astype(int)
     bbox_max = np.max(bboxes[:, 1, :], axis=0).ravel().astype(int)
@@ -176,10 +226,13 @@ def read_image(test_data_path, series_name, sizes=(128, 128, 128)):
     bbox[1] = bbox_max
 
     data = np.concatenate(images_list, axis=1)
-    data_crop = resample_np(
-        data[:, :, bbox_min[0]:bbox_max[0], bbox_min[1]:bbox_max[1], bbox_min[2]:bbox_max[2]],
-        (1, len(DATA_SUFFIXES),) + sizes,
-        1)
+    if data.shape[2:] == sizes:
+        data_crop = data
+    else:
+        data_crop = resample_np(
+            data[:, :, bbox_min[0]:bbox_max[0], bbox_min[1]:bbox_max[1], bbox_min[2]:bbox_max[2]],
+            (1, len(DATA_SUFFIXES),) + sizes,
+            1)
 
     bbox_ret = [
         bbox_min[0], bbox_max[0],
@@ -187,7 +240,7 @@ def read_image(test_data_path, series_name, sizes=(128, 128, 128)):
         bbox_min[2], bbox_max[2]
     ]
 
-    return data, data_crop, handle.affine, image.shape, bbox_ret
+    return data, data_crop, affine, original_shape, bbox_ret
 
 
 def main():
@@ -248,17 +301,20 @@ def main():
     if not os.path.exists(args.path_to_input_data):
         raise AttributeError("Path to input data: '{}' does not exist".format(args.path_to_input_data))
 
-    is_nifti_data = os.path.isdir(args.path_to_input_data)
+    input_type = get_input_type(args.path_to_input_data)
+    is_nifti_data = (input_type == NIFTI_FILE or input_type == NIFTI_FOLDER)
 
-    if is_nifti_data:
+    if input_type == NIFTI_FOLDER:
         series_name = find_series_name(args.path_to_input_data)
         original_data, data_crop, affine, original_size, bbox = \
-            read_image(args.path_to_input_data, series_name=series_name, sizes=(h, w, d))
+            read_image(args.path_to_input_data, data_name=series_name, sizes=(d, h, w),
+                       mri_sequence_order=args.mri_sequence, full_intensities_range=args.full_intensities_range)
 
+    elif input_type == NIFTI_FILE:
+        original_data, data_crop, affine, original_size, bbox = \
+            read_image(args.path_to_input_data, data_name=args.path_to_input_data, sizes=(d, h, w), is_series=False,
+                       mri_sequence_order=args.mri_sequence, full_intensities_range=args.full_intensities_range)
     else:
-        if not (fnmatch(args.path_to_input_data, '*.tif') or fnmatch(args.path_to_input_data, '*.tiff')):
-            raise AttributeError("Input file extension must have tiff format")
-
         data_crop = np.zeros(shape=(n, c, d, h, w), dtype=np.float)
         im_seq = ImageSequence.Iterator(Image.open(args.path_to_input_data))
         for i, page in enumerate(im_seq):
@@ -298,15 +354,29 @@ def main():
             x = bbox[1] - bbox[0]
             y = bbox[3] - bbox[2]
             z = bbox[5] - bbox[4]
-            seg_result[bbox[0]:bbox[1], bbox[2]:bbox[3], bbox[4]:bbox[5]] = \
-                np.argmax(resample_np(data, (channels, x, y, z), 1), axis=0)
-        elif channels == 1:
-            reshaped_data = data.reshape(out_d, out_h, out_w)
+            out_result = np.zeros(shape=((channels,) + original_size), dtype=float)
+            out_result[:,bbox[0]:bbox[1], bbox[2]:bbox[3], bbox[4]:bbox[5]] = \
+                resample_np(data, (channels, x, y, z), 1)
+        else:
+            out_result = data
+
+        if channels == 1:
+            reshaped_data = out_result.reshape(original_size[0], original_size[1], original_size[2])
             mask = reshaped_data[:, :, :] > 0.5
             reshaped_data[mask] = 1
             seg_result = reshaped_data.astype(int)
-        else:
-            seg_result = np.argmax(data, axis=0).astype(int)
+        elif channels == 4:
+            seg_result = np.argmax(out_result, axis=0).astype(int)
+        elif channels == 3:
+            res = np.zeros(shape=out_result.shape, dtype=bool)
+            res = out_result > 0.5
+            wt = res[0]
+            tc = res[1]
+            et = res[2]
+
+            seg_result[wt] = 2
+            seg_result[tc] = 1
+            seg_result[et] = 3
 
         im = np.stack([original_data[batch, 0, :, :, :],
                        original_data[batch, 0, :, :, :],
@@ -320,7 +390,7 @@ def main():
         mask = seg_result[:, :, :] > 0
         im[mask] = color_seg_frame[mask]
 
-        for k in range(out_d):
+        for k in range(im.shape[2]):
             if is_nifti_data:
                 list_img.append(Image.fromarray(im[:, :, k, :].astype('uint8'), 'RGB'))
             else:
@@ -335,7 +405,8 @@ def main():
 
     # --------------------------------------------- 7. Save output -----------------------------------------------
     tiff_output_name = os.path.join(args.path_to_output, 'output.tiff')
-    Image.new('RGB', (data.shape[3], data.shape[2])).save(tiff_output_name, append_images=list_img, save_all=True)
+    Image.new('RGB', (original_data.shape[3], original_data.shape[2])).save(tiff_output_name, \
+        append_images=list_img, save_all=True)
     logger.info("Result tiff file was saved to {}".format(tiff_output_name))
 
     if args.output_nifti and is_nifti_data:
@@ -344,6 +415,5 @@ def main():
             nib.save(nib.Nifti1Image(seg_res, affine=affine), nii_filename)
             logger.info("Result nifti file was saved to {}".format(nii_filename))
 
-
 if __name__ == "__main__":
     main()
diff --git a/demos/python_demos/3d_segmentation_demo/README.md b/demos/python_demos/3d_segmentation_demo/README.md
index a1423d4979f..1cb2813b63e 100644
--- a/demos/python_demos/3d_segmentation_demo/README.md
+++ b/demos/python_demos/3d_segmentation_demo/README.md
@@ -26,8 +26,8 @@ usage: 3d_segmentation_demo.py [-h] -i PATH_TO_INPUT_DATA -m PATH_TO_MODEL -o
 Options:
   -h, --help            Show this help message and exit.
   -i PATH_TO_INPUT_DATA, --path_to_input_data PATH_TO_INPUT_DATA
-                        Required. Path to an input folder with NIfTI data/TIFF
-                        file
+                        Required. Path to an input folder with NIfTI
+                        data/NIFTI file/TIFF file
   -m PATH_TO_MODEL, --path_to_model PATH_TO_MODEL
                         Required. Path to an .xml file with a trained model
   -o PATH_TO_OUTPUT, --path_to_output PATH_TO_OUTPUT
@@ -49,6 +49,10 @@ Options:
   -c PATH_TO_CLDNN_CONFIG, --path_to_cldnn_config PATH_TO_CLDNN_CONFIG
                         Required for GPU custom kernels. Absolute path to an
                         .xml file with the kernels description.
+  -ms N1,N2,N3,N4, --mri_sequence N1,N2,N3,N4
+                        Optional. Transfer MRI-sequence from dataset order to the network order.
+  --full_intensities_range
+                        Optional. Take intensities of the input image in a full range.
 ```
 
 Running the application with the empty list of options yields the usage message and an error message.
@@ -60,14 +64,23 @@ For example, to do inference on a 3D TIFF image using a trained network with mul
 command:
 
 ```
-python3 3d_segmentation_demo.py -i <path_to_image>/inputImage.tiff -m <path_to_model>/multiple-output.xml -d CPU -o <path_to_output>
+python3 3d_segmentation_demo.py -i <path_to_image>/inputImage.tiff -m <path_to_model>/brain-tumor-segmentation-0001.xml -d CPU -o <path_to_output>
 ```
      
-For example, to do inference on an 3D NIfTI image using a trained network with multiple outputs on CPU and save 
+For example, to do inference on 3D NIfTI images using a trained network with multiple outputs on CPU and save 
 output TIFF and NIFTI images, run the following command:
 ```
-python3 3d_segmentation_demo.py -i <path_to_nifti_images> -m <path_to_model>/multiple-output.xml -d CPU -o <path_to_output> -nii
+python3 3d_segmentation_demo.py -i <path_to_nifti_images> -m <path_to_model>/brain-tumor-segmentation-0001.xml -d CPU -o <path_to_output> -nii -ms 2,0,3,1
 ```
+For example, to do inference on a single 3D NIfTI image and save an output TIFF image, run the following command:
+```
+python3 3d_segmentation_demo.py -i <path_to_nifti_image>/PackedImage.nii -m <path_to_model>/brain-tumor-segmentation-0001.xml -d CPU -o <path_to_output> -ms 2,0,3,1
+```
+The `-ms` option reorders the input modalities, whose order depends on the dataset, into the order the network expects. For example, the modalities in the [Medical Decathlon](http://medicaldecathlon.com/) brain tumor segmentation data are stored in a different order than the networks require. For Medical Decathlon brain tumor data, the correct value is `2,0,3,1` for `brain-tumor-segmentation-0001` and `1,2,3,0` for `brain-tumor-segmentation-0002`.
+```
+python3 3d_segmentation_demo.py -i <path_to_nifti_images> -m <path_to_model>/brain-tumor-segmentation-0002.xml -d CPU -o <path_to_output> -nii -ms 1,2,3,0 --full_intensities_range
+```
+The `--full_intensities_range` option controls preprocessing of the input data, which differs between models. For example, `brain-tumor-segmentation-0001` expects data normalized to the [0,1] range with non-positive values set to zero, while `brain-tumor-segmentation-0002` requires only z-score normalization over the full range. Therefore, set the `--full_intensities_range` flag when using the `brain-tumor-segmentation-0002` model; `brain-tumor-segmentation-0001` requires no preprocessing option.
      
 ## Demo Output
 The demo outputs a multipage TIFF image and a NIFTI archive.
diff --git a/demos/python_demos/action_recognition/README.md b/demos/python_demos/action_recognition/README.md
index aa18d773fa8..3aef50f6677 100644
--- a/demos/python_demos/action_recognition/README.md
+++ b/demos/python_demos/action_recognition/README.md
@@ -60,6 +60,7 @@ Options:
   --fps FPS             Optional. FPS for renderer
   -lb LABELS, --labels LABELS
                         Optional. Path to file with label names
+  --no_show             Optional. Don't show output
 ```
 
 Running the application with an empty list of options yields the usage message given above and an error message.
diff --git a/demos/python_demos/action_recognition/action_recognition.py b/demos/python_demos/action_recognition/action_recognition.py
index 1a4cd54a0d9..b8355977fc2 100755
--- a/demos/python_demos/action_recognition/action_recognition.py
+++ b/demos/python_demos/action_recognition/action_recognition.py
@@ -28,9 +28,9 @@
 from os import path
 
 
-def video_demo(encoder, decoder, videos, fps=30, labels=None):
+def video_demo(encoder, decoder, videos, no_show, fps=30, labels=None):
     """Continuously run demo on provided video list"""
-    result_presenter = ResultRenderer(labels=labels)
+    result_presenter = ResultRenderer(no_show=no_show, labels=labels)
     run_pipeline(videos, encoder, decoder, result_presenter.render_frame, fps=fps)
 
 
@@ -54,6 +54,7 @@ def build_argparser():
                       default="CPU", type=str)
     args.add_argument("--fps", help="Optional. FPS for renderer", default=30, type=int)
     args.add_argument("-lb", "--labels", help="Optional. Path to file with label names", type=str)
+    args.add_argument("--no_show", action='store_true', help="Optional. Don't show output")
 
     return parser
 
@@ -102,7 +103,7 @@ def main():
     encoder = IEModel(encoder_xml, encoder_bin, ie, encoder_target_device,
                       num_requests=(3 if args.device == 'MYRIAD' else 1))
     decoder = IEModel(decoder_xml, decoder_bin, ie, decoder_target_device, num_requests=2)
-    video_demo(encoder, decoder, videos, args.fps, labels)
+    video_demo(encoder, decoder, videos, args.no_show, args.fps, labels)
 
 
 if __name__ == '__main__':
diff --git a/demos/python_demos/action_recognition/action_recognition_demo/result_renderer.py b/demos/python_demos/action_recognition/action_recognition_demo/result_renderer.py
index 52fe5fdaa93..8888f0284fe 100644
--- a/demos/python_demos/action_recognition/action_recognition_demo/result_renderer.py
+++ b/demos/python_demos/action_recognition/action_recognition_demo/result_renderer.py
@@ -31,8 +31,9 @@
 
 
 class ResultRenderer(object):
-    def __init__(self, display_fps=False, display_confidence=True, number_of_predictions=1, labels=None,
+    def __init__(self, no_show, display_fps=False, display_confidence=True, number_of_predictions=1, labels=None,
                  output_height=720):
+        self.no_show = no_show
         self.number_of_predictions = number_of_predictions
         self.display_confidence = display_confidence
         self.display_fps = display_fps
@@ -84,11 +85,12 @@ def render_frame(self, frame, logits, timers, frame_ind):
             cv2.putText(frame, "Inference time: {:.2f}ms ({:.2f} FPS)".format(inference_time, fps),
                         text_loc, FONT_STYLE, FONT_SIZE, FONT_COLOR)
 
-        cv2.imshow("Action Recognition", frame)
+        if not self.no_show:
+            cv2.imshow("Action Recognition", frame)
 
-        key = cv2.waitKey(1) & 0xFF
-        if key in {ord('q'), ord('Q'), 27}:
-            return -1
+            key = cv2.waitKey(1) & 0xFF
+            if key in {ord('q'), ord('Q'), 27}:
+                return -1
 
 
 class LabelPostprocessing:
diff --git a/demos/python_demos/action_recognition/action_recognition_demo/timer.py b/demos/python_demos/action_recognition/action_recognition_demo/timer.py
index a1f9e639905..07acd7e7490 100644
--- a/demos/python_demos/action_recognition/action_recognition_demo/timer.py
+++ b/demos/python_demos/action_recognition/action_recognition_demo/timer.py
@@ -60,7 +60,7 @@ def time_section(self):
         self.tock()
 
     def __repr__(self):
-        return "{:.2f}ms (±{:.2f}) {:.2f}fps".format(self.avg, self.std, self.fps)
+        return "{:.2f}ms (+/-: {:.2f}) {:.2f}fps".format(self.avg, self.std, self.fps)
 
 
 class TimerGroup:
diff --git a/demos/python_demos/asl_recognition_demo/README.md b/demos/python_demos/asl_recognition_demo/README.md
new file mode 100644
index 00000000000..74ba470bfef
--- /dev/null
+++ b/demos/python_demos/asl_recognition_demo/README.md
@@ -0,0 +1,89 @@
+# ASL Recognition Python* Demo
+
+This demo demonstrates how to run ASL (American Sign Language) Recognition models using OpenVINO&trade; toolkit.
+
+## How It Works
+
+The demo application expects an ASL recognition model in the Intermediate Representation (IR) format.
+
+As input, the demo application takes:
+* a path to a video file or a device node of a web-camera specified with a command line argument `--input`
+* a path to a file in JSON format with ASL class names specified with a command line argument `--class_map`
+
+The demo workflow is the following:
+
+1. The demo application reads video frames one by one, runs a person detector that extracts the ROI, and tracks the ROI of the very first person. An additional process is used to prepare a batch of frames with a constant frame rate.
+2. The batch of frames and the extracted ROI are passed to an artificial neural network that predicts the ASL gesture.
+3. The app visualizes the results of its work in a graphical window where the following objects are shown:
+    - Input frame with detected ROI.
+    - Last recognized ASL gesture.
+    - Performance characteristics.
+
+> **NOTE**: By default, Open Model Zoo demos expect input with BGR channels order. If you trained your model to work with RGB order, you need to manually rearrange the default channels order in the demo application or reconvert your model using the Model Optimizer tool with `--reverse_input_channels` argument specified. For more information about the argument, refer to **When to Reverse Input Channels** section of [Converting a Model Using General Conversion Parameters](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_convert_model_Converting_Model_General.html).
+
+## Running
+
+Run the application with the `-h` option to see the following usage message:
+
+```
+usage: asl_recognition_demo.py [-h] -m_a ACTION_MODEL -m_d DETECTION_MODEL -i
+                               INPUT -c CLASS_MAP [-s SAMPLES_DIR] [-d DEVICE]
+                               [-l CPU_EXTENSION] [--no_show]
+
+Options:
+  -h, --help            Show this help message and exit.
+  -m_a ACTION_MODEL, --action_model ACTION_MODEL
+                        Required. Path to an .xml file with a trained asl
+                        recognition model.
+  -m_d DETECTION_MODEL, --detection_model DETECTION_MODEL
+                        Required. Path to an .xml file with a trained person
+                        detector model.
+  -i INPUT, --input INPUT
+                        Required. Path to a video file or a device node of a
+                        web-camera.
+  -c CLASS_MAP, --class_map CLASS_MAP
+                        Required. Path to a file with ASL classes.
+  -s SAMPLES_DIR, --samples_dir SAMPLES_DIR
+                        Optional. Path to a directory with video samples of
+                        gestures.
+  -d DEVICE, --device DEVICE
+                        Optional. Specify the target device to infer on: CPU,
+                        GPU, FPGA, HDDL or MYRIAD. The demo will look for a
+                        suitable plugin for device specified (by default, it
+                        is CPU).
+  -l CPU_EXTENSION, --cpu_extension CPU_EXTENSION
+                        Optional. Required for CPU custom layers. Absolute
+                        path to a shared library with the kernels
+                        implementations.
+  --no_show             Optional. Do not visualize inference results.
+```
+
+Running the application with an empty list of options yields the short version of the usage message and an error message.
+
+To run the demo, you can use public or pre-trained models. To download the pre-trained models, use the OpenVINO [Model Downloader](../../../tools/downloader/README.md) or go to [https://download.01.org/opencv/](https://download.01.org/opencv/).
+
+> **NOTE**: Before running the demo with a trained model, make sure the model is converted to the Inference Engine format (`*.xml` + `*.bin`) using the [Model Optimizer tool](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html).
+
+To run the demo, please provide paths to the ASL recognition and person detection models in the IR format, to a file with class names, and to an input video:
+```bash
+python asl_recognition_demo.py \
+-m_a /home/user/asl-recognition-0003.xml \
+-m_d /home/user/person-detection-asl-0001.xml \
+-i 0 \
+-c ./classes.json
+```
+
+An example of a file with class names can be found [here](./classes.json).
+
+> **NOTE**: To run the demo application with video examples of ASL gestures, specify the `-s` key with a valid path to the directory with video samples. The name of each video sample should be a valid gesture name from the `./classes.json` file. To navigate between samples, use the 'n' and 'p' keys to switch to the next and previous video sample, respectively.
+
+## Demo Output
+
+The application uses OpenCV to display ASL gesture recognition result and current inference performance.
+
+![](./asl_recognition_demo.jpg)
+
+## See Also
+* [Using Open Model Zoo demos](../../README.md)
+* [Model Optimizer](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html)
+* [Model Downloader](../../../tools/downloader/README.md)
diff --git a/demos/python_demos/asl_recognition_demo/asl_recognition_demo.jpg b/demos/python_demos/asl_recognition_demo/asl_recognition_demo.jpg
new file mode 100644
index 00000000000..aa04fe4fe14
Binary files /dev/null and b/demos/python_demos/asl_recognition_demo/asl_recognition_demo.jpg differ
diff --git a/demos/python_demos/asl_recognition_demo/asl_recognition_demo.py b/demos/python_demos/asl_recognition_demo/asl_recognition_demo.py
new file mode 100755
index 00000000000..b71b436495f
--- /dev/null
+++ b/demos/python_demos/asl_recognition_demo/asl_recognition_demo.py
@@ -0,0 +1,184 @@
+#!/usr/bin/env python
+"""
+ Copyright (c) 2019 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import logging as log
+import sys
+import time
+import json
+from os.path import exists
+from argparse import ArgumentParser, SUPPRESS
+
+import cv2
+import numpy as np
+
+from asl_recognition_demo.common import load_ie_core
+from asl_recognition_demo.video_stream import VideoStream
+from asl_recognition_demo.video_library import VideoLibrary
+from asl_recognition_demo.person_detector import PersonDetector
+from asl_recognition_demo.person_tracker import PersonTracker
+from asl_recognition_demo.action_recognizer import ActionRecognizer
+
+DETECTOR_OUTPUT_SHAPE = -1, 5  # passed to PersonDetector as output_shape
+TRACKER_SCORE_THRESHOLD = 0.5  # passed to PersonTracker as score_threshold
+TRACKER_IOU_THRESHOLD = 0.5  # passed to PersonTracker as iou_threshold
+ACTION_NET_INPUT_FPS = 15  # second positional argument of VideoStream
+ACTION_NUM_CLASSES = 100  # passed to ActionRecognizer as num_classes
+ACTION_IMAGE_SCALE = 256  # passed to ActionRecognizer as img_scale
+ACTION_SCORE_THRESHOLD = 0.8  # the caption is updated only when the top score exceeds this
+SAMPLES_WINDOW_SIZE = 640, 480  # second positional argument of VideoLibrary
+
+
+def build_argparser():
+    """Builds the demo's command-line parser; all options live in one 'Options' group."""
+
+    cli_parser = ArgumentParser(add_help=False)
+    options = cli_parser.add_argument_group('Options')
+    options.add_argument('-h', '--help', default=SUPPRESS, action='help',
+                         help='Show this help message and exit.')
+    options.add_argument('-m_a', '--action_model',
+                         required=True, type=str,
+                         help='Required. Path to an .xml file with a trained asl recognition model.')
+    options.add_argument('-m_d', '--detection_model',
+                         required=True, type=str,
+                         help='Required. Path to an .xml file with a trained person detector model.')
+    options.add_argument('-i', '--input',
+                         required=True, type=str,
+                         help='Required. Path to a video file or a device node of a web-camera.')
+    options.add_argument('-c', '--class_map',
+                         required=True, type=str,
+                         help='Required. Path to a file with ASL classes.')
+    options.add_argument('-s', '--samples_dir',
+                         default=None, type=str,
+                         help='Optional. Path to a directory with video samples of gestures.')
+    options.add_argument('-d', '--device',
+                         default='CPU', type=str,
+                         help='Optional. Specify the target device to infer on: CPU, GPU, FPGA, '
+                              'HDDL or MYRIAD. The demo will look for a suitable plugin for '
+                              'device specified (by default, it is CPU).')
+    options.add_argument('-l', '--cpu_extension',
+                         default=None, type=str,
+                         help='Optional. Required for CPU custom layers. Absolute path to '
+                              'a shared library with the kernels implementations.')
+    options.add_argument('--no_show', action='store_true',
+                         help='Optional. Do not visualize inference results.')
+
+    return cli_parser
+
+
+def load_class_map(file_path):
+    """Reads a JSON iterable of class names and maps each position to its name.
+
+    Returns None when no path is given or the file does not exist.
+    """
+    if file_path is None or not exists(file_path):
+        return None
+
+    with open(file_path, 'r') as class_file:
+        class_names = json.load(class_file)
+    return {class_id: name for class_id, name in enumerate(class_names)}
+
+
+def main():
+    """Runs the demo loop. Raises RuntimeError when the class map file cannot be loaded."""
+
+    log.basicConfig(format='[ %(levelname)s ] %(message)s', level=log.INFO, stream=sys.stdout)
+    args = build_argparser().parse_args()
+
+    # Fail fast on a bad class map (an `assert` would be stripped under `python -O`).
+    class_map = load_class_map(args.class_map)
+    if class_map is None:
+        raise RuntimeError('Cannot load class map from {}'.format(args.class_map))
+
+    ie_core = load_ie_core(args.device, args.cpu_extension)
+    person_detector = PersonDetector(args.detection_model, args.device, ie_core,
+                                     num_requests=2, output_shape=DETECTOR_OUTPUT_SHAPE)
+    action_recognizer = ActionRecognizer(args.action_model, args.device, ie_core,
+                                         num_requests=2, img_scale=ACTION_IMAGE_SCALE,
+                                         num_classes=ACTION_NUM_CLASSES)
+    person_tracker = PersonTracker(person_detector, TRACKER_SCORE_THRESHOLD, TRACKER_IOU_THRESHOLD)
+
+    video_stream = VideoStream(args.input, ACTION_NET_INPUT_FPS, action_recognizer.input_length)
+    video_stream.start()
+
+    samples_library = None
+    last_caption = None
+    try:  # everything after start() is guarded so the stream is released on any error
+        if args.samples_dir is not None and exists(args.samples_dir):
+            samples_library = VideoLibrary(args.samples_dir, SAMPLES_WINDOW_SIZE,
+                                           list(class_map.values()))
+
+        start_time = time.perf_counter()
+        while True:
+            frame = video_stream.get_live_frame()
+            batch = video_stream.get_batch()
+            if frame is None or batch is None:
+                break
+
+            person_roi = person_tracker.get_roi(frame)
+            if person_roi is not None:
+                recognizer_result = action_recognizer(batch, person_roi)
+                if recognizer_result is not None:
+                    action_class_id = int(np.argmax(recognizer_result))
+                    # Fall back to the raw id when the class map has no entry for it.
+                    action_class_label = class_map.get(action_class_id, action_class_id)
+
+                    action_class_score = np.max(recognizer_result)
+                    if action_class_score > ACTION_SCORE_THRESHOLD:
+                        last_caption = 'Last gesture: {} '.format(action_class_label)
+
+            end_time = time.perf_counter()
+            elapsed_time = end_time - start_time
+            start_time = end_time
+            # Guard against a zero interval between two consecutive iterations.
+            current_fps = 1.0 / elapsed_time if elapsed_time > 0 else 0.0
+            cv2.putText(frame, 'FPS: {:.2f}'.format(current_fps), (10, 40),
+                        cv2.FONT_HERSHEY_SIMPLEX, 0.8, (0, 255, 0), 2)
+
+            if last_caption is not None:
+                cv2.putText(frame, last_caption, (10, frame.shape[0] - 10),
+                            cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2)
+
+            if person_roi is not None:
+                cv2.rectangle(frame, (person_roi[0], person_roi[1]),
+                              (person_roi[2], person_roi[3]), (128, 128, 128), 1)
+
+            if args.no_show:
+                continue
+
+            cv2.imshow('Demo', frame)
+            key = cv2.waitKey(1)
+            if key == 27:  # Esc
+                break
+
+            if samples_library is not None:
+                sample_frame = samples_library.get_frame()
+                if sample_frame is not None:
+                    cv2.imshow('Sample', sample_frame)
+
+                if key == ord('n'):
+                    samples_library.next()
+                elif key == ord('p'):
+                    samples_library.prev()
+    finally:
+        cv2.destroyAllWindows()
+        video_stream.release()
+        if samples_library is not None:
+            samples_library.release()
+
+
+if __name__ == '__main__':
+    sys.exit(main() or 0)
diff --git a/demos/python_demos/asl_recognition_demo/asl_recognition_demo/__init__.py b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/__init__.py
new file mode 100644
index 00000000000..e69de29bb2d
diff --git a/demos/python_demos/asl_recognition_demo/asl_recognition_demo/action_recognizer.py b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/action_recognizer.py
new file mode 100644
index 00000000000..167ad5a02ef
--- /dev/null
+++ b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/action_recognizer.py
@@ -0,0 +1,109 @@
+"""
+ Copyright (c) 2019 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import cv2
+import numpy as np
+
+from asl_recognition_demo.common import IEModel
+
+
+class ActionRecognizer(IEModel):
+    """ Class that is used to work with action recognition model. """
+
+    def __init__(self, model_path, device, ie_core, num_requests, img_scale, num_classes):
+        """Loads the model and stores the clip length, frame size, scale and class count"""
+
+        super().__init__(model_path, device, ie_core, num_requests)
+
+        _, _, t, h, w = self.input_size  # 5-D input; the last three dims are length, height, width
+        self.input_height = h
+        self.input_width = w
+        self.input_length = t
+
+        self.img_scale = img_scale
+        self.num_test_classes = num_classes
+
+    @staticmethod
+    def _convert_to_central_roi(src_roi, input_height, input_width, img_scale):
+        """Returns the central part of ROI [x0, y0, x1, y1], shrunk by input size / img_scale"""
+
+        src_roi_height, src_roi_width = src_roi[3] - src_roi[1], src_roi[2] - src_roi[0]
+        src_roi_center_x = 0.5 * (src_roi[0] + src_roi[2])
+        src_roi_center_y = 0.5 * (src_roi[1] + src_roi[3])
+
+        height_scale = float(input_height) / float(img_scale)
+        width_scale = float(input_width) / float(img_scale)
+        assert height_scale < 1.0
+        assert width_scale < 1.0
+
+        min_roi_size = min(src_roi_height, src_roi_width)  # the shorter ROI side drives both sizes
+        trg_roi_height = int(height_scale * min_roi_size)
+        trg_roi_width = int(width_scale * min_roi_size)
+
+        trg_roi = [int(src_roi_center_x - 0.5 * trg_roi_width),
+                   int(src_roi_center_y - 0.5 * trg_roi_height),
+                   int(src_roi_center_x + 0.5 * trg_roi_width),
+                   int(src_roi_center_y + 0.5 * trg_roi_height)]
+
+        return trg_roi
+
+    def _process_image(self, input_image, roi):
+        """Crops the ROI, resizes it to the network input, converts BGR to RGB and HWC to CHW"""
+
+        cropped_image = input_image[roi[1]:roi[3], roi[0]:roi[2]]
+        resized_image = cv2.resize(cropped_image, (self.input_width, self.input_height))
+        out_image = cv2.cvtColor(resized_image, cv2.COLOR_BGR2RGB)
+        return out_image.transpose(2, 0, 1).astype(np.float32)
+
+    def _prepare_net_input(self, images, roi):
+        """Converts input sequence of images into blob of data"""
+
+        data = np.stack([self._process_image(img, roi) for img in images], axis=0)  # (T, C, H, W)
+        data = data.reshape((1,) + data.shape)  # add a leading axis of size 1
+        data = np.transpose(data, (0, 2, 1, 3, 4))  # swap the T and C axes
+        return data
+
+    def async_infer(self, frame_buffer, person_roi, req_id):
+        """Requests model inference for the specified batch of images"""
+
+        central_roi = self._convert_to_central_roi(person_roi,
+                                                   self.input_height, self.input_width,
+                                                   self.img_scale)
+
+        clip_data = self._prepare_net_input(frame_buffer, central_roi)
+
+        super().async_infer(clip_data, req_id)
+
+    def wait_request(self, req_id):
+        """Waits for the model output; returns None when the base class reports no result"""
+
+        result = super().wait_request(req_id)
+        if result is None:
+            return None
+        else:
+            return result[:self.num_test_classes]
+
+    def __call__(self, frame_buffer, person_roi):
+        """Runs model synchronously on the specified frames and person ROI"""
+
+        central_roi = self._convert_to_central_roi(person_roi,
+                                                   self.input_height, self.input_width,
+                                                   self.img_scale)
+        clip_data = self._prepare_net_input(frame_buffer, central_roi)
+
+        result = self.infer(clip_data)
+
+        return result[:self.num_test_classes]  # NOTE(review): slices axis 0 — confirm output layout
diff --git a/demos/python_demos/asl_recognition_demo/asl_recognition_demo/common.py b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/common.py
new file mode 100644
index 00000000000..1870557e448
--- /dev/null
+++ b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/common.py
@@ -0,0 +1,98 @@
+"""
+ Copyright (c) 2019 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+from openvino.inference_engine import IENetwork, IECore  # pylint: disable=no-name-in-module
+
+
+def load_ie_core(device, cpu_extension=None):
+    """Creates an IECore; registers the extension library when the device is CPU and one is given"""
+
+    core = IECore()
+    needs_extension = device == "CPU" and bool(cpu_extension)
+    if needs_extension:
+        core.add_extension(cpu_extension, "CPU")
+    return core
+
+
+class IEModel:  # pylint: disable=too-few-public-methods
+    """ Class that allows working with Inference Engine model. """
+
+    def __init__(self, model_path, device, ie_core, num_requests, output_shape=None):
+        """Reads the network, checks layer support, loads it and selects the input/output names"""
+        if model_path.endswith((".xml", ".bin")):
+            model_path = model_path[:-4]  # drop the 4-character extension
+        model_xml = model_path + ".xml"
+        model_bin = model_path + ".bin"
+        self.net = IENetwork(model=model_xml, weights=model_bin)
+        assert len(self.net.inputs.keys()) == 1, "One input is expected"
+
+        supported_layers = ie_core.query_network(self.net, device)
+        not_supported_layers = [l for l in self.net.layers.keys() if l not in supported_layers]
+        if len(not_supported_layers) > 0:
+            raise RuntimeError("Following layers are not supported by the {} plugin:\n {}"
+                               .format(device, ', '.join(not_supported_layers)))
+
+        self.exec_net = ie_core.load_network(network=self.net,
+                                             device_name=device,
+                                             num_requests=num_requests)
+
+        self.input_name = next(iter(self.net.inputs))
+        if len(self.net.outputs) > 1:
+            if output_shape is not None:
+                candidates = []  # outputs whose shape matches output_shape
+                for candidate_name in self.net.outputs:
+                    candidate_shape = self.exec_net.requests[0].outputs[candidate_name].shape
+                    if len(candidate_shape) != len(output_shape):
+                        continue
+
+                    matches = [src == trg or trg < 0  # a negative target dim matches any size
+                               for src, trg in zip(candidate_shape, output_shape)]
+                    if all(matches):
+                        candidates.append(candidate_name)
+
+                if len(candidates) != 1:
+                    raise Exception("One output is expected")
+
+                self.output_name = candidates[0]
+            else:
+                raise Exception("One output is expected")
+        else:
+            self.output_name = next(iter(self.net.outputs))
+
+        self.input_size = self.net.inputs[self.input_name].shape
+        self.output_size = self.exec_net.requests[0].outputs[self.output_name].shape
+        self.num_requests = num_requests
+
+    def infer(self, data):
+        """Runs model synchronously on the specified input and returns the selected output"""
+
+        input_data = {self.input_name: data}
+        infer_result = self.exec_net.infer(input_data)
+        return infer_result[self.output_name]
+
+    def async_infer(self, data, req_id):
+        """Requests model inference for the specified input"""
+
+        input_data = {self.input_name: data}
+        self.exec_net.start_async(request_id=req_id, inputs=input_data)
+
+    def wait_request(self, req_id):
+        """Waits for the request and returns the selected output, or None if wait() returns non-zero"""
+
+        if self.exec_net.requests[req_id].wait(-1) == 0:  # NOTE(review): presumably 0 is OK — confirm
+            return self.exec_net.requests[req_id].outputs[self.output_name]
+        else:
+            return None
diff --git a/demos/python_demos/asl_recognition_demo/asl_recognition_demo/person_detector.py b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/person_detector.py
new file mode 100644
index 00000000000..c968092db33
--- /dev/null
+++ b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/person_detector.py
@@ -0,0 +1,97 @@
+"""
+ Copyright (c) 2019 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import cv2
+import numpy as np
+
+from asl_recognition_demo.common import IEModel
+
+
+class PersonDetector(IEModel):
+    """ Class that allows working with person detector models. """
+
+    def __init__(self, model_path, device, ie_core, num_requests, output_shape=None):
+        """Loads the model and stores its input height and width"""
+
+        super().__init__(model_path, device, ie_core, num_requests, output_shape)
+
+        _, _, h, w = self.input_size
+        self.input_height = h
+        self.input_width = w
+
+        self.last_scales = None
+        self.last_sizes = None
+
+    def _prepare_frame(self, frame):
+        """Resizes the frame to the network input; returns the blob, frame size and size ratios"""
+
+        initial_h, initial_w = frame.shape[:2]
+        scale_h, scale_w = initial_h / float(self.input_height), initial_w / float(self.input_width)
+
+        in_frame = cv2.resize(frame, (self.input_width, self.input_height))
+        in_frame = in_frame.transpose((2, 0, 1))
+        in_frame = in_frame.reshape(self.input_size)
+
+        return in_frame, initial_h, initial_w, scale_h, scale_w
+
+    @staticmethod
+    def _process_output(result, initial_h, initial_w, scale_h, scale_w):
+        """Converts network output to rows of [xmin, ymin, xmax, ymax, conf]"""
+
+        if result.shape[-1] == 5:  # format: [xmin, ymin, xmax, ymax, conf]
+            return np.array([[scale_w, scale_h, scale_w, scale_h, 1.0]]) * result
+        else:  # format: [image_id, label, conf, xmin, ymin, xmax, ymax]
+            # NOTE(review): scales (frame/input ratio) are multiplied by frame size again — confirm
+            scale_w *= initial_w
+            scale_h *= initial_h
+            out = np.array([[1.0, scale_w, scale_h, scale_w, scale_h]]) * result[0, 0, :, 2:]
+            # out columns are [conf, xmin, ymin, xmax, ymax]: move conf (column 0) to the end
+            return np.concatenate((out[:, 1:], out[:, 0].reshape([-1, 1])), axis=1)
+
+    def async_infer(self, frame, req_id):
+        """Requests model inference for the specified image"""
+
+        in_frame, initial_h, initial_w, scale_h, scale_w = self._prepare_frame(frame)
+        self.last_sizes = initial_h, initial_w
+        self.last_scales = scale_h, scale_w
+
+        super().async_infer(in_frame, req_id)
+
+    def wait_request(self, req_id):
+        """Waits for the model output; raises ValueError if async_infer was never called"""
+
+        if self.last_scales is None or self.last_sizes is None:
+            raise ValueError('Unexpected request')
+
+        result = super().wait_request(req_id)
+        if result is None:
+            return None
+
+        initial_h, initial_w = self.last_sizes
+        scale_h, scale_w = self.last_scales
+
+        out = self._process_output(result, initial_h, initial_w, scale_h, scale_w)
+
+        return out
+
+    def __call__(self, frame):
+        """Runs model on the specified input"""
+
+        in_frame, initial_h, initial_w, scale_h, scale_w = self._prepare_frame(frame)
+        result = self.infer(in_frame)
+        out = self._process_output(result, initial_h, initial_w, scale_h, scale_w)
+
+        return out
diff --git a/demos/python_demos/asl_recognition_demo/asl_recognition_demo/person_tracker.py b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/person_tracker.py
new file mode 100644
index 00000000000..07880a5d1af
--- /dev/null
+++ b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/person_tracker.py
@@ -0,0 +1,126 @@
+"""
+ Copyright (c) 2019 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import numpy as np
+
+
+class PersonTracker:  # pylint: disable=too-few-public-methods
+    """ Class that allows working with person tracking. """
+
+    def __init__(self, detector, score_threshold, iou_threshold, smooth_weight=0.5):
+        """Stores the detector, thresholds and smoothing weight; starts with no tracked ROI"""
+
+        self._detector = detector
+        self._score_threshold = score_threshold
+        self._iou_threshold = iou_threshold
+        self._smooth_weight = smooth_weight
+
+        self._last_roi = None
+        self._cur_req_id, self._next_req_id = 0, 1
+
+    @staticmethod
+    def _matrix_iou(set_a, set_b):
+        """Computes pairwise IoU of two box sets; the result has shape (len(set_a), len(set_b))"""
+
+        # NOTE(review): names call column 0 "y" while _track treats column 0 as x; IoU is unaffected
+        intersect_ymin = np.maximum(set_a[:, 0].reshape([-1, 1]), set_b[:, 0].reshape([1, -1]))
+        intersect_xmin = np.maximum(set_a[:, 1].reshape([-1, 1]), set_b[:, 1].reshape([1, -1]))
+        intersect_ymax = np.minimum(set_a[:, 2].reshape([-1, 1]), set_b[:, 2].reshape([1, -1]))
+        intersect_xmax = np.minimum(set_a[:, 3].reshape([-1, 1]), set_b[:, 3].reshape([1, -1]))
+
+        intersect_heights = np.maximum(0.0, intersect_ymax - intersect_ymin)
+        intersect_widths = np.maximum(0.0, intersect_xmax - intersect_xmin)
+
+        intersect_areas = intersect_heights * intersect_widths
+        areas_set_a = ((set_a[:, 2] - set_a[:, 0]) * (set_a[:, 3] - set_a[:, 1])).reshape([-1, 1])
+        areas_set_b = ((set_b[:, 2] - set_b[:, 0]) * (set_b[:, 3] - set_b[:, 1])).reshape([1, -1])
+
+        areas_set_a[np.less(areas_set_a, 0.0)] = 0.0
+        areas_set_b[np.less(areas_set_b, 0.0)] = 0.0
+
+        union_areas = areas_set_a + areas_set_b - intersect_areas
+
+        iou_values = intersect_areas / union_areas
+        iou_values[np.less_equal(union_areas, 0.0)] = 0.0  # overwrite results of division by zero
+
+        return iou_values
+
+    def _track(self, last_roi, new_detections, score_threshold, iou_threshold):
+        """Picks the detection that best overlaps the last ROI, or else the largest detection"""
+
+        valid_ids = np.where(new_detections[:, 4] > score_threshold)[0]
+        if len(valid_ids) == 0:
+            return None
+
+        filtered_detections = new_detections[valid_ids, :4]
+
+        new_roi = None
+        if last_roi is not None:
+            iou_values = self._matrix_iou(last_roi.reshape([1, -1]), filtered_detections)
+            iou_values = iou_values.reshape([-1])
+
+            best_match_id = np.argmax(iou_values)
+            best_match_value = iou_values[best_match_id]
+            if best_match_value > iou_threshold:
+                new_roi = filtered_detections[best_match_id]
+
+        if new_roi is None:  # nothing tracked yet, or the best overlap is below the threshold
+            det_heights = filtered_detections[:, 3] - filtered_detections[:, 1]
+            det_widths = filtered_detections[:, 2] - filtered_detections[:, 0]
+            det_squares = det_heights * det_widths
+
+            best_det_id = np.argmax(det_squares)
+            new_roi = filtered_detections[best_det_id]
+
+        return new_roi
+
+    @staticmethod
+    def _smooth_roi(last_roi, new_roi, weight):
+        """Blends the new ROI with the last one; weight is the share of the last ROI"""
+
+        if last_roi is None:
+            return new_roi
+
+        return weight * last_roi + (1.0 - weight) * new_roi
+
+    @staticmethod
+    def _clip_roi(roi, frame_size):
+        """Clips ROI limits to the frame size (height, width) after casting them to int"""
+
+        frame_height, frame_width = frame_size
+        return [np.maximum(0, int(roi[0])),
+                np.maximum(0, int(roi[1])),
+                np.minimum(frame_width, int(roi[2])),
+                np.minimum(frame_height, int(roi[3]))]
+
+    def get_roi(self, frame):
+        """Returns ROI of tracked person as an int32 array, or None when nothing is tracked"""
+
+        self._detector.async_infer(frame, self._next_req_id)
+
+        detections = self._detector.wait_request(self._cur_req_id)  # the other request id
+
+        out_roi = None
+        if detections is not None:
+            new_roi = self._track(self._last_roi, detections,
+                                  self._score_threshold, self._iou_threshold)
+            if new_roi is not None:
+                smoothed_roi = self._smooth_roi(self._last_roi, new_roi, self._smooth_weight)
+                out_roi = self._clip_roi(smoothed_roi, frame.shape[:2])
+
+        self._cur_req_id, self._next_req_id = self._next_req_id, self._cur_req_id  # swap the ids
+        self._last_roi = np.array(out_roi, dtype=np.float32) if out_roi is not None else None
+
+        return np.array(out_roi, dtype=np.int32) if out_roi is not None else None
diff --git a/demos/python_demos/asl_recognition_demo/asl_recognition_demo/video_library.py b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/video_library.py
new file mode 100644
index 00000000000..7df2ca12858
--- /dev/null
+++ b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/video_library.py
@@ -0,0 +1,121 @@
+"""
+ Copyright (c) 2019 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+from os import listdir
+from os.path import join, isfile
+
+import cv2
+
+
+class VideoLibrary:
+    """ Holds a list of gesture videos and replays the selected one in a loop. """
+
+    def __init__(self, source_dir, trg_size, class_names):
+        """Indexes videos from `source_dir` named after `class_names`; frames are resized to `trg_size`"""
+
+        found_sources = self.parse_source_paths(source_dir, class_names)
+        assert len(found_sources) > 0, "Can't find videos in " + str(source_dir)
+
+        self.trg_size = trg_size
+        self.source_paths = found_sources
+        self.cur_source_id = 0
+        self.cap = None
+
+    @property
+    def num_sources(self):
+        """Number of videos held by the library"""
+
+        return len(self.source_paths)
+
+    @property
+    def cur_source(self):
+        """The (name, path) entry of the currently selected video"""
+
+        return self.source_paths[self.cur_source_id]
+
+    @staticmethod
+    def parse_source_paths(input_dir, valid_names):
+        """Returns (name, path) pairs, sorted by file name, for the usable videos of `input_dir`"""
+
+        # a file qualifies when the lower-cased text before its first dot is a known class name
+        allowed_names = {name.lower() for name in valid_names}
+
+        # listdir order is arbitrary, so sort to get a stable playback order
+        file_names = sorted(f for f in listdir(input_dir) if isfile(join(input_dir, f)))
+
+        sources = []
+        for file_name in file_names:
+            source_name = file_name.split('.')[0].lower()
+            if source_name not in allowed_names:
+                continue
+
+            source_path = join(input_dir, file_name)
+            # keep only files OpenCV can open and that report at least one frame
+            probe = cv2.VideoCapture(source_path)
+            if probe.isOpened():
+                frame_count = int(probe.get(cv2.CAP_PROP_FRAME_COUNT))
+                probe.release()
+
+                if frame_count > 0:
+                    sources.append((source_name, source_path))
+
+        return sources
+
+    def release(self):
+        """Closes the capture of the active video, if one is open"""
+
+        opened_cap = self.cap
+        if opened_cap is not None:
+            opened_cap.release()
+        self.cap = None
+
+    def next(self):
+        """Selects the following video, wrapping to the first one after the last"""
+
+        self.release()
+
+        following_id = self.cur_source_id + 1
+        wrapped = following_id >= self.num_sources
+        self.cur_source_id = 0 if wrapped else following_id
+
+    def prev(self):
+        """Selects the preceding video, wrapping to the last one before the first"""
+
+        self.release()
+
+        preceding_id = self.cur_source_id - 1
+        wrapped = preceding_id < 0
+        self.cur_source_id = self.num_sources - 1 if wrapped else preceding_id
+
+    def get_frame(self):
+        """Returns the next frame of the selected video, resized and captioned; rewinds at the end"""
+
+        gesture_name, video_path = self.cur_source
+
+        if self.cap is None:
+            self.cap = cv2.VideoCapture(video_path)
+
+        _, image = self.cap.read()
+        if image is None:
+            self.cap.set(cv2.CAP_PROP_POS_FRAMES, 0)
+            _, image = self.cap.read()
+            assert image is not None
+
+        image = cv2.resize(image, self.trg_size)
+        caption_origin = (10, image.shape[0] - 10)
+        cv2.putText(image, 'Gesture: {}'.format(gesture_name), caption_origin,
+                    cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 255, 0), 2)
+        return image
diff --git a/demos/python_demos/asl_recognition_demo/asl_recognition_demo/video_stream.py b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/video_stream.py
new file mode 100644
index 00000000000..ca64648fe10
--- /dev/null
+++ b/demos/python_demos/asl_recognition_demo/asl_recognition_demo/video_stream.py
@@ -0,0 +1,176 @@
+"""
+ Copyright (c) 2019 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import time
+from os.path import exists
+from multiprocessing import Process, Value, Array
+
+import cv2
+import numpy as np
+
+
+class VideoStream:
+    """ Serves the latest live frame and constant-framerate batches filled by background processes. """
+
+    def __init__(self, input_source, trg_fps, batch_size):
+        """Probes `input_source` for its frame size and allocates the shared buffers; starts nothing"""
+
+        try:
+            self._input_source = int(input_source)
+        except ValueError:
+            self._input_source = input_source
+
+        self._trg_fps = trg_fps
+        assert self._trg_fps > 0
+        self._batch_size = batch_size
+        assert self._batch_size > 0
+
+        cap = cv2.VideoCapture(self._input_source)
+        assert cap.isOpened(), "Can't open " + str(self._input_source)
+
+        source_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+        source_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+        cap.release()
+
+        self._image_shape = [source_height, source_width, 3]
+        self._batch_shape = [batch_size] + self._image_shape
+
+        self._image_buffer_size = int(np.prod(self._image_shape))
+        self._batch_buffer_size = int(np.prod(self._batch_shape))
+        # shared state handed to the worker processes: finish flag, live frame, paced frame, paced batch
+        self._source_finished = Value('i', False, lock=False)
+        self._raw_frame = Array('B', self._image_buffer_size, lock=True)
+        self._slow_frame = Array('B', self._image_buffer_size, lock=True)
+        self._slow_batch = Array('B', self._batch_buffer_size, lock=True)
+
+        self._frame_generator_process = None
+        self._producer_process = None
+
+    def get_live_frame(self):
+        """Returns a copy of the latest frame written by the reader process, or None once the source ended"""
+
+        if self._source_finished.value:
+            return None
+
+        with self._raw_frame.get_lock():
+            buffer = np.frombuffer(self._raw_frame.get_obj(), dtype=np.uint8)
+            frame = np.copy(buffer.reshape(self._image_shape))
+
+        return frame
+
+    def get_batch(self):
+        """Returns a copy of the latest constant-framerate batch, or None once the source ended"""
+
+        if self._source_finished.value:
+            return None
+
+        with self._slow_batch.get_lock():
+            buffer = np.frombuffer(self._slow_batch.get_obj(), dtype=np.uint8)
+            batch = np.copy(buffer.reshape(self._batch_shape))
+
+        return batch
+
+    def start(self):
+        """Starts the two daemon worker processes: the source reader and the constant-rate producer"""
+
+        self._frame_generator_process = \
+            Process(target=self._frame_generator,
+                    args=(self._input_source, self._raw_frame, self._image_shape,
+                          self._source_finished))
+        self._frame_generator_process.daemon = True
+        self._frame_generator_process.start()
+
+        self._producer_process = \
+            Process(target=self._producer,
+                    args=(self._raw_frame, self._slow_frame, self._slow_batch,
+                          self._trg_fps, self._batch_size, self._image_shape,
+                          self._source_finished))
+        self._producer_process.daemon = True
+        self._producer_process.start()
+
+    def release(self):
+        """Terminates the worker processes that have been created by start()"""
+
+        if self._frame_generator_process is not None:
+            self._frame_generator_process.terminate()
+
+        if self._producer_process is not None:
+            self._producer_process.terminate()
+
+    @staticmethod
+    def _frame_generator(input_source, out_frame, frame_shape, finish_flag):
+        """Copies frames from the source into `out_frame` at the source FPS; sets `finish_flag` at the end"""
+
+        cap = cv2.VideoCapture(input_source)
+        cap.set(cv2.CAP_PROP_BUFFERSIZE, 1)
+        # backends that cannot report FPS return 0: read without pacing instead of dividing by zero
+        source_fps = cap.get(cv2.CAP_PROP_FPS)
+        trg_time_step = 1.0 / float(source_fps) if source_fps > 0 else 0.0
+
+        start_time = time.perf_counter()
+        while True:
+            _, frame = cap.read()
+            if frame is None:
+                break
+
+            with out_frame.get_lock():
+                buffer = np.frombuffer(out_frame.get_obj(), dtype=np.uint8)
+                np.copyto(buffer.reshape(frame_shape), frame)
+
+            end_time = time.perf_counter()
+            elapsed_time = end_time - start_time
+            start_time = end_time
+            rest_time = trg_time_step - elapsed_time
+            if rest_time > 0.0:
+                time.sleep(rest_time)
+
+        finish_flag.value = True
+        cap.release()
+
+    @staticmethod
+    def _producer(input_frame, out_frame, out_batch, trg_fps, batch_size, image_shape, finish_flag):
+        """Samples `input_frame` every 1/trg_fps seconds into `out_frame` and, once `batch_size`
+           samples are collected, publishes the most recent `batch_size` of them to `out_batch`"""
+
+        trg_time_step = 1.0 / float(trg_fps)
+        batch_shape = [batch_size] + image_shape
+        frame_buffer = []
+
+        start_time = time.perf_counter()
+        while not finish_flag.value:
+            with input_frame.get_lock():
+                in_frame_buffer = np.frombuffer(input_frame.get_obj(), dtype=np.uint8)
+                frame = np.copy(in_frame_buffer.reshape(image_shape))
+
+            with out_frame.get_lock():
+                out_frame_buffer = np.frombuffer(out_frame.get_obj(), dtype=np.uint8)
+                np.copyto(out_frame_buffer.reshape(image_shape), frame)
+
+            frame_buffer.append(frame)
+            if len(frame_buffer) > batch_size:
+                frame_buffer = frame_buffer[-batch_size:]
+
+            if len(frame_buffer) == batch_size:
+                with out_batch.get_lock():
+                    out_batch_buffer = np.frombuffer(out_batch.get_obj(), dtype=np.uint8)
+                    np.copyto(out_batch_buffer.reshape(batch_shape), frame_buffer)
+
+            end_time = time.perf_counter()
+            elapsed_time = end_time - start_time
+            start_time = end_time
+            rest_time = trg_time_step - elapsed_time
+            if rest_time > 0.0:
+                time.sleep(rest_time)
diff --git a/demos/python_demos/asl_recognition_demo/classes.json b/demos/python_demos/asl_recognition_demo/classes.json
new file mode 100644
index 00000000000..b06cbb0c92f
--- /dev/null
+++ b/demos/python_demos/asl_recognition_demo/classes.json
@@ -0,0 +1,101 @@
+["hello",
+"nice",
+"teacher",
+"eat",
+"no",
+"happy",
+"like",
+"orange",
+"want",
+"deaf",
+"school",
+"sister",
+"finish",
+"white",
+"bird",
+"what",
+"tired",
+"friend",
+"sit",
+"mother",
+"yes",
+"student",
+"learn",
+"spring",
+"good",
+"fish",
+"again",
+"sad",
+"table",
+"need",
+"where",
+"father",
+"milk",
+"cousin",
+"brother",
+"paper",
+"forget",
+"nothing",
+"book",
+"girl",
+"fine",
+"black",
+"boy",
+"lost",
+"family",
+"hearing",
+"bored",
+"please",
+"water",
+"computer",
+"help",
+"doctor",
+"yellow",
+"write",
+"hungry",
+"but",
+"drink",
+"bathroom",
+"man",
+"how",
+"understand",
+"red",
+"beautiful",
+"sick",
+"blue",
+"green",
+"english",
+"name",
+"you",
+"who",
+"same",
+"nurse",
+"day",
+"now",
+"brown",
+"thanks",
+"hurt",
+"here",
+"grandmother",
+"pencil",
+"walk",
+"bad",
+"read",
+"when",
+"dance",
+"play",
+"sign",
+"go",
+"big",
+"sorry",
+"work",
+"draw",
+"grandfather",
+"woman",
+"right",
+"france",
+"pink",
+"know",
+"live",
+"night"
+]
diff --git a/demos/python_demos/asl_recognition_demo/models.lst b/demos/python_demos/asl_recognition_demo/models.lst
new file mode 100644
index 00000000000..76c3c505099
--- /dev/null
+++ b/demos/python_demos/asl_recognition_demo/models.lst
@@ -0,0 +1,3 @@
+# This file can be used with the --list option of the model downloader.
+asl-recognition-????
+person-detection-asl-????
diff --git a/demos/python_demos/colorization_demo/README.md b/demos/python_demos/colorization_demo/README.md
new file mode 100644
index 00000000000..f85a343763b
--- /dev/null
+++ b/demos/python_demos/colorization_demo/README.md
@@ -0,0 +1,56 @@
+# Colorization Demo
+
+This demo demonstrates an example of using neural networks to colorize a video.
+You can use the following models with the demo:
+
+* `colorization-v2`
+* `colorization-v2-norebal`
+
+For more information about the pre-trained models, refer to the [model documentation](../../../models/public/index.md).
+
+### How it works
+
+On the start-up, the application reads command line parameters and loads one network to the Inference Engine for execution.
+
+Having received the image, the program:
+1) converts the video frame into the LAB color space
+2) uses the L-channel to predict the A and B channels
+3) restores the image by converting it back into the BGR color space
+
+### Running the demo:
+
+Running the application with the `-h` option yields the following usage message:
+
+```
+colorization_demo.py -h
+
+usage: colorization_demo.py [-h] -m MODEL --coeffs COEFFS [-d DEVICE] -i
+                            "<path>" [--no_show] [-v]
+
+Options:
+  -h, --help            Help with the script.
+  -m MODEL, --model MODEL
+                        Required. Path to .xml file with pre-trained model.
+  --coeffs COEFFS       Required. Path to .npy file with color coefficients.
+  -d DEVICE, --device DEVICE
+                        Optional. Specify target device for infer: CPU, GPU,
+                        FPGA, HDDL or MYRIAD. Default: CPU
+  -i "<path>", --input "<path>"
+                        Required. Input to process.
+  --no_show             Optional. Disable display of results on screen.
+  -v, --verbose         Optional. Enable display of processing logs on screen.
+```
+
+To run the demo, you can use public or pre-trained models. To download the pre-trained models, use the OpenVINO [Model Downloader](../../../tools/downloader/README.md) or go to [https://download.01.org/opencv/](https://download.01.org/opencv/).
+
+> **NOTE**: Before running the demo with a trained model, make sure the model is converted to the Inference Engine format (\*.xml + \*.bin) using the [Model Optimizer tool](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html).
+
+### Demo output
+
+The demo uses OpenCV to display the colorized frame.
+
+## See also
+
+* [Using Open Model Zoo demos](../../README.md)
+* [Model Optimizer](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html)
+* [Model Downloader](../../../tools/downloader/README.md)
diff --git a/demos/python_demos/colorization_demo/colorization_demo.py b/demos/python_demos/colorization_demo/colorization_demo.py
new file mode 100644
index 00000000000..75f4a598888
--- /dev/null
+++ b/demos/python_demos/colorization_demo/colorization_demo.py
@@ -0,0 +1,138 @@
+#!/usr/bin/env python
+"""
+ Copyright (c) 2018 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+from openvino.inference_engine import IENetwork, IECore
+import cv2 as cv
+import numpy as np
+import os
+from argparse import ArgumentParser, SUPPRESS
+import logging as log
+import sys
+
+
+def build_arg():
+    """Builds the demo's command-line parser with every option listed under one 'Options' group."""
+
+    parser = ArgumentParser(add_help=False)
+    options = parser.add_argument_group('Options')
+    options.add_argument('-h', '--help', action='help', default=SUPPRESS, help='Help with the script.')
+    options.add_argument("-m", "--model", required=True, type=str,
+                         help="Required. Path to .xml file with pre-trained model.")
+    options.add_argument("--coeffs", required=True, type=str,
+                         help="Required. Path to .npy file with color coefficients.")
+    options.add_argument("-d", "--device", default="CPU", type=str,
+                         help="Optional. Specify target device for infer: CPU, GPU, FPGA, HDDL or MYRIAD. "
+                              "Default: CPU")
+    options.add_argument('-i', "--input", required=True, type=str, metavar='"<path>"',
+                         help='Required. Input to process.')
+    options.add_argument("--no_show", action='store_true', default=False,
+                         help="Optional. Disable display of results on screen.")
+    options.add_argument("-v", "--verbose", action='store_true', default=False,
+                         help="Optional. Enable display of processing logs on screen.")
+    return parser
+
+
+if __name__ == '__main__':
+    args = build_arg().parse_args()
+    model_path = os.path.splitext(args.model)[0]
+    weights_bin = model_path + ".bin"
+    coeffs = args.coeffs
+
+    # mean is stored in the source caffe model and passed to IR
+    log.basicConfig(format="[ %(levelname)s ] %(message)s",
+                    level=log.INFO if not args.verbose else log.DEBUG, stream=sys.stdout)
+
+    log.debug("Load network")
+    load_net = IENetwork(model=args.model, weights=weights_bin)
+    load_net.batch_size = 1
+    exec_net = IECore().load_network(network=load_net, device_name=args.device)
+
+    assert len(load_net.inputs) == 1, "Expected number of inputs is equal 1"
+    input_blob = next(iter(load_net.inputs))
+    input_shape = load_net.inputs[input_blob].shape
+    assert input_shape[1] == 1, "Expected model input shape with 1 channel"
+
+    assert len(load_net.outputs) == 1, "Expected number of outputs is equal 1"
+    output_blob = next(iter(load_net.outputs))
+    output_shape = load_net.outputs[output_blob].shape
+    assert output_shape == [1, 313, 56, 56], "Shape of outputs does not match network shape outputs"
+
+    _, _, h_in, w_in = input_shape
+    # an input that parses as an integer is handed to OpenCV as an int; anything else is used as given
+    try:
+        input_source = int(args.input)
+    except ValueError:
+        input_source = args.input
+    # fail fast on an unusable source instead of silently leaving the frame loop on the first read
+    cap = cv.VideoCapture(input_source)
+    if not cap.isOpened():
+        raise IOError("{} not exist".format(input_source))
+
+    color_coeff = np.load(coeffs).astype(np.float32)
+    assert color_coeff.shape == (313, 2), "Current shape of color coefficients does not match required shape"
+
+    while True:
+        log.debug("#############################")
+        hasFrame, original_frame = cap.read()
+        if not hasFrame:
+            break
+        (h_orig, w_orig) = original_frame.shape[:2]
+
+        log.debug("Preprocessing frame")
+        if original_frame.shape[2] > 1:
+            frame = cv.cvtColor(cv.cvtColor(original_frame, cv.COLOR_BGR2GRAY), cv.COLOR_GRAY2RGB)
+        else:
+            frame = cv.cvtColor(original_frame, cv.COLOR_GRAY2RGB)
+
+        img_rgb = frame.astype(np.float32) / 255
+        img_lab = cv.cvtColor(img_rgb, cv.COLOR_RGB2Lab)
+        img_l_rs = cv.resize(img_lab.copy(), (w_in, h_in))[:, :, 0]
+
+        log.debug("Network inference")
+        res = exec_net.infer(inputs={input_blob: [img_l_rs]})
+        # weight the 313 output channels by their two coefficients and sum over them -> (2, 56, 56) map
+        update_res = (res[output_blob] * color_coeff.transpose()[:, :, np.newaxis, np.newaxis]).sum(1)
+
+        log.debug("Get results")
+        out = update_res.transpose((1, 2, 0))
+        out = cv.resize(out, (w_orig, h_orig))
+        img_lab_out = np.concatenate((img_lab[:, :, 0][:, :, np.newaxis], out), axis=2)
+        img_bgr_out = np.clip(cv.cvtColor(img_lab_out, cv.COLOR_Lab2BGR), 0, 1)
+
+        if not args.no_show:
+            log.debug("Show results")
+            imshowSize = (640, 480)
+            original_image = cv.resize(original_frame, imshowSize)
+            grayscale_image = cv.resize(frame, imshowSize)
+            colorize_image = (cv.resize(img_bgr_out, imshowSize) * 255).astype(np.uint8)
+            lab_image = (cv.resize(img_lab_out, imshowSize)).astype(np.uint8)
+
+            original_image = cv.putText(original_image, 'Original', (25, 50),
+                                        cv.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2, cv.LINE_AA)
+            grayscale_image = cv.putText(grayscale_image, 'Grayscale', (25, 50),
+                                        cv.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2, cv.LINE_AA)
+            colorize_image = cv.putText(colorize_image, 'Colorize', (25, 50),
+                                        cv.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2, cv.LINE_AA)
+            lab_image = cv.putText(lab_image, 'LAB interpetation', (25, 50),
+                                   cv.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2, cv.LINE_AA)
+
+            ir_image = [cv.hconcat([original_image, grayscale_image]),
+                        cv.hconcat([lab_image, colorize_image])]
+            final_image = cv.vconcat(ir_image)
+            cv.imshow('Colorization Demo', final_image)
+            if not cv.waitKey(1) < 0:
+                break
diff --git a/demos/python_demos/colorization_demo/models.lst b/demos/python_demos/colorization_demo/models.lst
new file mode 100644
index 00000000000..408e0e267a8
--- /dev/null
+++ b/demos/python_demos/colorization_demo/models.lst
@@ -0,0 +1,3 @@
+# This file can be used with the --list option of the model downloader.
+colorization-v2
+colorization-v2-norebal
diff --git a/demos/python_demos/face_recognition_demo/README.md b/demos/python_demos/face_recognition_demo/README.md
index 14f21920d2a..e74b301cc2b 100644
--- a/demos/python_demos/face_recognition_demo/README.md
+++ b/demos/python_demos/face_recognition_demo/README.md
@@ -71,15 +71,18 @@ pip install -r requirements.txt
 Running the application with the `-h` option or without
 any arguments yields the following message:
 
-``` sh
+```
 python ./face_recognition_demo.py -h
 
 usage: face_recognition_demo.py [-h] [-i PATH] [-o PATH] [--no_show] [-tl]
-                                [-cw CROP_WIDTH] [-ch CROP_HEIGHT] -fg PATH
+                                [-cw CROP_WIDTH] [-ch CROP_HEIGHT]
+                                [--match_algo {HUNGARIAN,MIN_DIST}] -fg PATH
                                 [--run_detector] -m_fd PATH -m_lm PATH -m_reid
-                                PATH [-d_fd {CPU,GPU,FPGA,MYRIAD,HETERO}]
-                                [-d_lm {CPU,GPU,FPGA,MYRIAD,HETERO}]
-                                [-d_reid {CPU,GPU,FPGA,MYRIAD,HETERO}]
+                                PATH [-fd_iw FD_INPUT_WIDTH]
+                                [-fd_ih FD_INPUT_HEIGHT]
+                                [-d_fd {CPU,GPU,FPGA,MYRIAD,HETERO,HDDL}]
+                                [-d_lm {CPU,GPU,FPGA,MYRIAD,HETERO,HDDL}]
+                                [-d_reid {CPU,GPU,FPGA,MYRIAD,HETERO,HDDL}]
                                 [-l PATH] [-c PATH] [-v] [-pc] [-t_fd [0..1]]
                                 [-t_id [0..1]] [-exp_r_fd NUMBER]
 
@@ -102,6 +105,9 @@ General:
                         (optional) Crop the input stream to this height
                         (default: no crop). Both -cw and -ch parameters should
                         be specified to use crop.
+  --match_algo {HUNGARIAN,MIN_DIST}
+                        (optional)algorithm for face matching(default:
+                        HUNGARIAN)
 
 Faces database:
   -fg PATH              Path to the face images directory
@@ -122,6 +128,16 @@ Models:
   -m_fd PATH            Path to the Face Detection model XML file
   -m_lm PATH            Path to the Facial Landmarks Regression model XML file
   -m_reid PATH          Path to the Face Reidentification model XML file
+  -fd_iw FD_INPUT_WIDTH, --fd_input_width FD_INPUT_WIDTH
+                        (optional) specify the input width of detection model
+                        (default: use default input width of model).
+                        Both -fd_iw and -fd_ih parameters should be specified
+                        for reshape.
+  -fd_ih FD_INPUT_HEIGHT, --fd_input_height FD_INPUT_HEIGHT
+                        (optional) specify the input height of detection model
+                        (default: use default input height of model). 
+                        Both -fd_iw and -fd_ih parameters should be specified
+                        for reshape.
 
 Inference options:
   -d_fd {CPU,GPU,FPGA,MYRIAD,HETERO}
@@ -163,14 +179,13 @@ python ./face_recognition_demo.py \
 -m_fd <path_to_model>/face-detection-retail-0004.xml \
 -m_lm <path_to_model>/landmarks-regression-retail-0009.xml \
 -m_reid <path_to_model>/face-reidentification-retail-0095.xml \
--l <path_to_cpu_extensions>/libcpu_extension_sse4.so \
 --verbose \
 -fg "/home/face_gallery"
 ```
 
 Windows (`cmd`, `powershell`) (assuming OpenVINO installed in `C:/Intel/openvino`):
 
-``` powershell
+```bat
 # Set up the environment
 call C:/Intel/openvino/bin/setupvars.bat
 
@@ -178,7 +193,6 @@ python ./face_recognition_demo.py ^
 -m_fd <path_to_model>/face-detection-retail-0004.xml ^
 -m_lm <path_to_model>/landmarks-regression-retail-0009.xml ^
 -m_reid <path_to_model>/face-reidentification-retail-0095.xml ^
--l <path_to_cpu_extensions>/cpu_extension_avx2.dll ^
 --verbose ^
 -fg "C:/face_gallery"
 ```
diff --git a/demos/python_demos/face_recognition_demo/face_identifier.py b/demos/python_demos/face_recognition_demo/face_identifier.py
index 9a54dea0714..95c696b2d17 100644
--- a/demos/python_demos/face_recognition_demo/face_identifier.py
+++ b/demos/python_demos/face_recognition_demo/face_identifier.py
@@ -39,7 +39,7 @@ def __init__(self, id, distance, desc):
             self.distance = distance
             self.descriptor = desc
 
-    def __init__(self, model, match_threshold=0.5):
+    def __init__(self, model, match_threshold=0.5, match_algo='HUNGARIAN'):
         super(FaceIdentifier, self).__init__(model)
 
         assert len(model.inputs) == 1, "Expected 1 input blob"
@@ -57,6 +57,7 @@ def __init__(self, model, match_threshold=0.5):
         self.faces_database = None
 
         self.match_threshold = match_threshold
+        self.match_algo = match_algo
 
     def set_faces_database(self, database):
         self.faces_database = database
@@ -89,7 +90,7 @@ def get_matches(self):
 
         matches = []
         if len(descriptors) != 0:
-            matches = self.faces_database.match_faces(descriptors)
+            matches = self.faces_database.match_faces(descriptors, self.match_algo)
 
         results = []
         unknowns_list = []
diff --git a/demos/python_demos/face_recognition_demo/face_recognition_demo.py b/demos/python_demos/face_recognition_demo/face_recognition_demo.py
index 531fb6e6148..a7d0ece4f9e 100755
--- a/demos/python_demos/face_recognition_demo/face_recognition_demo.py
+++ b/demos/python_demos/face_recognition_demo/face_recognition_demo.py
@@ -32,6 +32,7 @@
 from face_identifier import FaceIdentifier
 
 DEVICE_KINDS = ['CPU', 'GPU', 'FPGA', 'MYRIAD', 'HETERO', 'HDDL']
+MATCH_ALGO = ['HUNGARIAN', 'MIN_DIST']
 
 
 def build_argparser():
@@ -55,6 +56,8 @@ def build_argparser():
                          help="(optional) Crop the input stream to this height " \
                          "(default: no crop). Both -cw and -ch parameters " \
                          "should be specified to use crop.")
+    general.add_argument('--match_algo', default='HUNGARIAN', choices=MATCH_ALGO,
+                         help="(optional)algorithm for face matching(default: %(default)s)")
 
     gallery = parser.add_argument_group('Faces database')
     gallery.add_argument('-fg', metavar="PATH", required=True,
@@ -70,7 +73,15 @@ def build_argparser():
                         help="Path to the Facial Landmarks Regression model XML file")
     models.add_argument('-m_reid', metavar="PATH", default="", required=True,
                         help="Path to the Face Reidentification model XML file")
-
+    models.add_argument('-fd_iw', '--fd_input_width', default=0, type=int,
+                         help="(optional) specify the input width of detection model " \
+                         "(default: use default input width of model). Both -fd_iw and -fd_ih parameters " \
+                         "should be specified for reshape.")
+    models.add_argument('-fd_ih', '--fd_input_height', default=0, type=int,
+                         help="(optional) specify the input height of detection model " \
+                         "(default: use default input height of model). Both -fd_iw and -fd_ih parameters " \
+                         "should be specified for reshape.")
+    
     infer = parser.add_argument_group('Inference options')
     infer.add_argument('-d_fd', default='CPU', choices=DEVICE_KINDS,
                        help="(optional) Target device for the " \
@@ -122,15 +133,24 @@ def __init__(self, args):
 
         log.info("Loading models")
         face_detector_net = self.load_model(args.m_fd)
+        
+        assert (args.fd_input_height and args.fd_input_width) or \
+               (args.fd_input_height==0 and args.fd_input_width==0), \
+            "Both -fd_iw and -fd_ih parameters should be specified for reshape"
+        
+        if args.fd_input_height and args.fd_input_width :
+            face_detector_net.reshape({"data": [1, 3, args.fd_input_height,args.fd_input_width]})
         landmarks_net = self.load_model(args.m_lm)
         face_reid_net = self.load_model(args.m_reid)
 
         self.face_detector = FaceDetector(face_detector_net,
                                           confidence_threshold=args.t_fd,
                                           roi_scale_factor=args.exp_r_fd)
+
         self.landmarks_detector = LandmarksDetector(landmarks_net)
         self.face_identifier = FaceIdentifier(face_reid_net,
-                                              match_threshold=args.t_id)
+                                              match_threshold=args.t_id,
+                                              match_algo = args.match_algo)
 
         self.face_detector.deploy(args.d_fd, context)
         self.landmarks_detector.deploy(args.d_lm, context,
diff --git a/demos/python_demos/face_recognition_demo/faces_database.py b/demos/python_demos/face_recognition_demo/faces_database.py
index 7ead34bb193..b81eb3bd43b 100644
--- a/demos/python_demos/face_recognition_demo/faces_database.py
+++ b/demos/python_demos/face_recognition_demo/faces_database.py
@@ -149,7 +149,7 @@ def ask_to_save(self, image):
         label = name if save else None
         return label
 
-    def match_faces(self, descriptors):
+    def match_faces(self, descriptors, match_algo='HUNGARIAN'):
         database = self.database
         distances = np.empty((len(descriptors), len(database)))
         for i, desc in enumerate(descriptors):
@@ -159,17 +159,25 @@ def match_faces(self, descriptors):
                     dist.append(FacesDatabase.Identity.cosine_dist(desc, id_desc))
                 distances[i][j] = dist[np.argmin(dist)]
 
-        # Find best assignments, prevent repeats, assuming faces can not repeat
-        _, assignments = linear_sum_assignment(distances)
         matches = []
-        for i in range(len(descriptors)):
-            if len(assignments) <= i: # assignment failure, too many faces
-                matches.append((0, 1.0))
-                continue
+        # If the user specifies MIN_DIST for face matching, the face with the minimum cosine distance is selected.
+        if match_algo == 'MIN_DIST':
+            for i in range(len(descriptors)):
+                id = np.argmin(distances[i])
+                min_dist = distances[i][id]
+                matches.append((id, min_dist))
+        else:
+            # Find best assignments, prevent repeats, assuming faces can not repeat
+            _, assignments = linear_sum_assignment(distances)
+            for i in range(len(descriptors)):
+                if len(assignments) <= i: # assignment failure, too many faces
+                    matches.append((0, 1.0))
+                    continue
+
+                id = assignments[i]
+                distance = distances[i, id]
+                matches.append((id, distance))
 
-            id = assignments[i]
-            distance = distances[i, id]
-            matches.append((id, distance))
         return matches
 
     def create_new_label(self, path, id):
diff --git a/demos/python_demos/face_recognition_demo/models.lst b/demos/python_demos/face_recognition_demo/models.lst
new file mode 100644
index 00000000000..cdd4d6b4667
--- /dev/null
+++ b/demos/python_demos/face_recognition_demo/models.lst
@@ -0,0 +1,6 @@
+# This file can be used with the --list option of the model downloader.
+face-detection-adas-????
+face-detection-adas-binary-????
+face-detection-retail-????
+face-reidentification-retail-????
+landmarks-regression-retail-????
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/README.md b/demos/python_demos/human_pose_estimation_3d_demo/README.md
new file mode 100644
index 00000000000..8f6dc625c7d
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/README.md
@@ -0,0 +1,85 @@
+# 3D Human Pose Estimation Python* Demo
+
+This demo demonstrates how to run 3D Human Pose Estimation models using OpenVINO&trade;. The following pre-trained models can be used:
+
+* `human-pose-estimation-3d-0001`.
+
+For more information about the pre-trained models, refer to the [model documentation](../../../models/public/index.md).
+
+> **NOTE**: Only batch size of 1 is supported.
+## How It Works
+
+The demo application expects a 3D human pose estimation model in the Intermediate Representation (IR) format.
+
+As input, the demo application can take:
+* a path to a video file or a device node of a web-camera.
+* a list of image paths.
+
+The demo workflow is the following:
+
+1. The demo application reads video frames one by one and estimates 3D human poses in a given frame.
+2. The app visualizes the results in a graphical window with 2D poses overlaid on the input image, and in a canvas with the corresponding 3D poses.
+
+> **NOTE**: By default, Open Model Zoo demos expect input with BGR channels order. If you trained your model to work with RGB order, you need to manually rearrange the default channels order in the demo application or reconvert your model using the Model Optimizer tool with `--reverse_input_channels` argument specified. For more information about the argument, refer to **When to Reverse Input Channels** section of [Converting a Model Using General Conversion Parameters](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_convert_model_Converting_Model_General.html).
+## Prerequisites
+
+This demo application requires a native Python extension module to be built before you can run it.
+Refer to [Using Open Model Zoo demos](../../README.md) for instructions on how to build it and prepare the environment for running the demo.
+
+## Running
+
+Run the application with the `-h` option to see the following usage message:
+
+```
+usage: human_pose_estimation_3d_demo.py [-h] -m MODEL [-i INPUT [INPUT ...]]
+                                        [-d DEVICE]
+                                        [--height_size HEIGHT_SIZE]
+                                        [--extrinsics_path EXTRINSICS_PATH]
+                                        [--fx FX] [--no_show]
+
+Lightweight 3D human pose estimation demo. Press esc to exit, "p" to (un)pause
+video or process next image.
+
+Options:
+  -h, --help            Show this help message and exit.
+  -m MODEL, --model MODEL
+                        Required. Path to an .xml file with a trained model.
+  -i INPUT [INPUT ...], --input INPUT [INPUT ...]
+                        Required. Path to input image, images, video file or
+                        camera id.
+  -d DEVICE, --device DEVICE
+                        Optional. Specify the target device to infer on: CPU,
+                        GPU, FPGA, HDDL or MYRIAD. The demo will look for a
+                        suitable plugin for device specified (by default, it
+                        is CPU).
+  --height_size HEIGHT_SIZE
+                        Optional. Network input layer height size.
+  --extrinsics_path EXTRINSICS_PATH
+                        Optional. Path to file with camera extrinsics.
+  --fx FX               Optional. Camera focal length.
+  --no_show             Optional. Do not display output.
+
+```
+
+Running the application with an empty list of options yields the short version of the usage message and an error message.
+
+To run the demo, you can use public or pre-trained models. To download the pre-trained models, use the OpenVINO [Model Downloader](../../../tools/downloader/README.md) or go to [https://download.01.org/opencv/](https://download.01.org/opencv/).
+
+> **NOTE**: Before running the demo with a trained model, make sure the model is converted to the Inference Engine format (`*.xml` + `*.bin`) using the [Model Optimizer tool](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html).
+To run the demo, please provide paths to the model in the IR format, and to an input video or image(s):
+```bash
+python human_pose_estimation_3d_demo.py \
+-m /home/user/human-pose-estimation-3d-0001.xml \
+-i /home/user/video_name.mp4
+```
+
+## Demo Output
+
+The application uses OpenCV to display found poses and current inference performance.
+
+![](./data/human_pose_estimation_3d_demo.jpg)
+
+## See Also
+* [Using Open Model Zoo demos](../../README.md)
+* [Model Optimizer](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html)
+* [Model Downloader](../../../tools/downloader/README.md)
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/data/extrinsics.json b/demos/python_demos/human_pose_estimation_3d_demo/data/extrinsics.json
new file mode 100644
index 00000000000..5f5c066dbc8
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/data/extrinsics.json
@@ -0,0 +1,30 @@
+{
+    "R": [
+        [
+            0.1656794936,
+            0.0336560618,
+            -0.9856051821
+        ],
+        [
+            -0.09224101321,
+            0.9955650135,
+            0.01849052095
+        ],
+        [
+            0.9818563545,
+            0.08784972047,
+            0.1680491765
+        ]
+    ],
+    "t": [
+        [
+            17.76193366
+        ],
+        [
+            126.741365
+        ],
+        [
+            286.3860507
+        ]
+    ]
+}
\ No newline at end of file
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/data/human_pose_estimation_3d_demo.jpg b/demos/python_demos/human_pose_estimation_3d_demo/data/human_pose_estimation_3d_demo.jpg
new file mode 100644
index 00000000000..b151c7a8284
Binary files /dev/null and b/demos/python_demos/human_pose_estimation_3d_demo/data/human_pose_estimation_3d_demo.jpg differ
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/human_pose_estimation_3d_demo.py b/demos/python_demos/human_pose_estimation_3d_demo/human_pose_estimation_3d_demo.py
new file mode 100644
index 00000000000..e9dab316bef
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/human_pose_estimation_3d_demo.py
@@ -0,0 +1,148 @@
+#!/usr/bin/env python
+"""
+ Copyright (c) 2019 Intel Corporation
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+      http://www.apache.org/licenses/LICENSE-2.0
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+from argparse import ArgumentParser, SUPPRESS
+import json
+import os
+
+import cv2
+import numpy as np
+
+from modules.inference_engine import InferenceEngine
+from modules.input_reader import InputReader
+from modules.draw import Plotter3d, draw_poses
+from modules.parse_poses import parse_poses
+
+
+def rotate_poses(poses_3d, R, t):
+    inverse_rotation = np.linalg.inv(R)  # applied below as R^-1 * (point - t)
+    for row in range(poses_3d.shape[0]):
+        joints = poses_3d[row].reshape((-1, 4)).T  # 4 values per joint; only rows 0..2 are transformed
+        joints[:3] = inverse_rotation.dot(joints[:3] - t)
+        poses_3d[row] = joints.T.reshape(-1)  # written back in place; the input array itself is returned
+
+    return poses_3d
+
+
+if __name__ == '__main__':
+    parser = ArgumentParser(description='Lightweight 3D human pose estimation demo. '
+                                        'Press esc to exit, "p" to (un)pause video or process next image.',
+                            add_help=False)
+    args = parser.add_argument_group('Options')
+    args.add_argument('-h', '--help', action='help', default=SUPPRESS,
+                      help='Show this help message and exit.')
+    args.add_argument('-m', '--model',
+                      help='Required. Path to an .xml file with a trained model.',
+                      type=str, required=True)
+    args.add_argument('-i', '--input',
+                      help='Required. Path to input image, images, video file or camera id.',
+                      nargs='+', default='')
+    args.add_argument('-d', '--device',
+                      help='Optional. Specify the target device to infer on: CPU, GPU, FPGA, HDDL or MYRIAD. '
+                           'The demo will look for a suitable plugin for device specified '
+                           '(by default, it is CPU).',
+                      type=str, default='CPU')
+    args.add_argument('--height_size', help='Optional. Network input layer height size.', type=int, default=256)
+    args.add_argument('--extrinsics_path',
+                      help='Optional. Path to file with camera extrinsics.',
+                      type=str, default=None)
+    args.add_argument('--fx', type=np.float32, default=-1, help='Optional. Camera focal length.')
+    args.add_argument('--no_show', help='Optional. Do not display output.', action='store_true')
+    args = parser.parse_args()
+
+    if args.input == '':  # -i was not given (its default is ''); argparse itself does not enforce it
+        raise ValueError('Please, provide input data.')
+
+    stride = 8  # shared by InferenceEngine and parse_poses
+    inference_engine = InferenceEngine(args.model, args.device, stride)
+    canvas_3d = np.zeros((720, 1280, 3), dtype=np.uint8)  # image the 3D view is drawn into
+    plotter = Plotter3d(canvas_3d.shape[:2])
+    canvas_3d_window_name = 'Canvas 3D'
+    if not args.no_show:
+        cv2.namedWindow(canvas_3d_window_name)
+        cv2.setMouseCallback(canvas_3d_window_name, Plotter3d.mouse_callback)
+
+    file_path = args.extrinsics_path
+    if file_path is None:  # fall back to data/extrinsics.json located next to this script
+        file_path = os.path.join(os.path.dirname(__file__), 'data', 'extrinsics.json')
+    with open(file_path, 'r') as f:
+        extrinsics = json.load(f)
+    R = np.array(extrinsics['R'], dtype=np.float32)
+    t = np.array(extrinsics['t'], dtype=np.float32)
+
+    frame_provider = InputReader(args.input)
+    is_video = frame_provider.is_video
+    base_height = args.height_size
+    fx = args.fx
+
+    delay = 1  # cv2.waitKey timeout in ms; 0 makes waitKey block, which is used as "paused"
+    esc_code = 27
+    p_code = 112  # ord('p')
+    space_code = 32
+    mean_time = 0  # smoothed per-frame processing time in seconds; 0 means "no measurement yet"
+    for frame in frame_provider:
+        current_time = cv2.getTickCount()
+        input_scale = base_height / frame.shape[0]  # scale that brings the frame height to base_height
+        scaled_img = cv2.resize(frame, dsize=None, fx=input_scale, fy=input_scale)
+        if fx < 0:  # Focal length is unknown
+            fx = np.float32(0.8 * frame.shape[1])  # derived once from the first frame's width, then reused
+
+        inference_result = inference_engine.infer(scaled_img)
+        poses_3d, poses_2d = parse_poses(inference_result, input_scale, stride, fx, is_video)
+        edges = []
+        if len(poses_3d) > 0:
+            poses_3d = rotate_poses(poses_3d, R, t)
+            poses_3d_copy = poses_3d.copy()  # read from a copy because poses_3d is overwritten just below
+            x = poses_3d_copy[:, 0::4]
+            y = poses_3d_copy[:, 1::4]
+            z = poses_3d_copy[:, 2::4]
+            poses_3d[:, 0::4], poses_3d[:, 1::4], poses_3d[:, 2::4] = -z, x, -y  # axis remap: (x, y, z) <- (-z, x, -y)
+
+            poses_3d = poses_3d.reshape(poses_3d.shape[0], 19, -1)[:, :, 0:3]  # 19 keypoints per pose, keep x, y, z
+            edges = (Plotter3d.SKELETON_EDGES + 19 * np.arange(poses_3d.shape[0]).reshape((-1, 1, 1))).reshape((-1, 2))
+        plotter.plot(canvas_3d, poses_3d, edges)
+
+        draw_poses(frame, poses_2d)
+        current_time = (cv2.getTickCount() - current_time) / cv2.getTickFrequency()  # elapsed seconds for this frame
+        if mean_time == 0:
+            mean_time = current_time
+        else:
+            mean_time = mean_time * 0.95 + current_time * 0.05  # exponential moving average
+        cv2.putText(frame, 'FPS: {}'.format(int(1 / mean_time * 10) / 10),
+                    (40, 80), cv2.FONT_HERSHEY_COMPLEX, 1, (0, 0, 255))
+        if args.no_show:  # nothing is displayed, so key handling is skipped as well
+            continue
+        cv2.imshow(canvas_3d_window_name, canvas_3d)
+        cv2.imshow('3D Human Pose Estimation', frame)
+
+        key = cv2.waitKey(delay)
+        if key == esc_code:
+            break
+        if key == p_code:  # "p" toggles between running (delay 1) and paused (delay 0)
+            if delay == 1:
+                delay = 0
+            else:
+                delay = 1
+        if delay == 0 or not is_video:  # allow to rotate 3D canvas while on pause
+            key = 0
+            while (key != p_code
+                   and key != esc_code
+                   and key != space_code):
+                plotter.plot(canvas_3d, poses_3d, edges)  # redraw so mouse rotation is visible while waiting
+                cv2.imshow(canvas_3d_window_name, canvas_3d)
+                key = cv2.waitKey(33)
+            if key == esc_code:
+                break
+            else:
+                delay = 1  # "p" or space resumes processing with the next frame/image
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/models.lst b/demos/python_demos/human_pose_estimation_3d_demo/models.lst
new file mode 100644
index 00000000000..2739b07c84b
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/models.lst
@@ -0,0 +1,2 @@
+# This file can be used with the --list option of the model downloader.
+human-pose-estimation-3d-????
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/modules/__init__.py b/demos/python_demos/human_pose_estimation_3d_demo/modules/__init__.py
new file mode 100644
index 00000000000..e69de29bb2d
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/modules/draw.py b/demos/python_demos/human_pose_estimation_3d_demo/modules/draw.py
new file mode 100644
index 00000000000..b3a3b12889d
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/modules/draw.py
@@ -0,0 +1,115 @@
+#!/usr/bin/env python
+"""
+ Copyright (c) 2019 Intel Corporation
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+      http://www.apache.org/licenses/LICENSE-2.0
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import math
+
+import cv2
+import numpy as np
+
+
+previous_position = []  # last mouse position [x, y] recorded by Plotter3d.mouse_callback
+theta, phi = math.pi / 4, -math.pi / 6  # view angles read by Plotter3d.plot and updated by mouse dragging
+should_rotate = False  # True between left-button press and release
+scale_dx = 800  # divisors converting mouse movement into an angle change (x and y respectively)
+scale_dy = 800
+
+
+class Plotter3d:
+    SKELETON_EDGES = np.array([[11, 10], [10, 9], [9, 0], [0, 3], [3, 4], [4, 5], [0, 6], [6, 7], [7, 8], [0, 12],
+                               [12, 13], [13, 14], [0, 1], [1, 15], [15, 16], [1, 17], [17, 18]])
+
+    def __init__(self, canvas_size, origin=(0.5, 0.5), scale=1):
+        self.origin = np.array([origin[1] * canvas_size[1], origin[0] * canvas_size[0]], dtype=np.float32)  # x, y
+        self.scale = np.float32(scale)
+        self.theta = 0  # NOTE: not read by this class; plot() uses the module-level theta/phi instead
+        self.phi = 0
+        axis_length = 200
+        axes = [  # three segments starting at the same corner, one along each of x, y and z
+            np.array([[-axis_length/2, -axis_length/2, 0], [axis_length/2, -axis_length/2, 0]], dtype=np.float32),
+            np.array([[-axis_length/2, -axis_length/2, 0], [-axis_length/2, axis_length/2, 0]], dtype=np.float32),
+            np.array([[-axis_length/2, -axis_length/2, 0], [-axis_length/2, -axis_length/2, axis_length]], dtype=np.float32)]
+        step = 20
+        for step_id in range(axis_length // step + 1):  # add grid
+            axes.append(np.array([[-axis_length / 2, -axis_length / 2 + step_id * step, 0],
+                                  [axis_length / 2, -axis_length / 2 + step_id * step, 0]], dtype=np.float32))
+            axes.append(np.array([[-axis_length / 2 + step_id * step, -axis_length / 2, 0],
+                                  [-axis_length / 2 + step_id * step, axis_length / 2, 0]], dtype=np.float32))
+        self.axes = np.array(axes)  # stacked segments: (segment, endpoint, xyz)
+
+    def plot(self, img, vertices, edges):
+        global theta, phi
+        img.fill(0)  # clear the canvas in place before redrawing
+        R = self._get_rotation(theta, phi)
+        self._draw_axes(img, R)
+        if len(edges) != 0:  # nothing but the axes/grid is drawn when there are no edges
+            self._plot_edges(img, vertices, edges, R)
+
+    def _draw_axes(self, img, R):
+        axes_2d = np.dot(self.axes, R)  # project every 3D endpoint to 2D with the 3x2 matrix R
+        axes_2d = axes_2d * self.scale + self.origin
+        for axe in axes_2d:
+            axe = axe.astype(int)
+            cv2.line(img, tuple(axe[0]), tuple(axe[1]), (128, 128, 128), 1, cv2.LINE_AA)
+
+    def _plot_edges(self, img, vertices, edges, R):
+        vertices_2d = np.dot(vertices, R)
+        edges_vertices = vertices_2d.reshape((-1, 2))[edges] * self.scale + self.origin  # pick both 2D endpoints per edge
+        for edge_vertices in edges_vertices:
+            edge_vertices = edge_vertices.astype(int)
+            cv2.line(img, tuple(edge_vertices[0]), tuple(edge_vertices[1]), (255, 255, 255), 1, cv2.LINE_AA)
+
+    def _get_rotation(self, theta, phi):
+        sin, cos = math.sin, math.cos
+        return np.array([
+            [ cos(theta),  sin(theta) * sin(phi)],
+            [-sin(theta),  cos(theta) * sin(phi)],
+            [ 0,                       -cos(phi)]
+        ], dtype=np.float32)  # transposed
+
+    @staticmethod
+    def mouse_callback(event, x, y, flags, params):
+        global previous_position, theta, phi, should_rotate, scale_dx, scale_dy
+        if event == cv2.EVENT_LBUTTONDOWN:  # start of a drag: remember where it began
+            previous_position = [x, y]
+            should_rotate = True
+        if event == cv2.EVENT_MOUSEMOVE and should_rotate:
+            theta += (x - previous_position[0]) / scale_dx * 2 * math.pi
+            phi -= (y - previous_position[1]) / scale_dy * 2 * math.pi * 2
+            phi = max(min(math.pi / 2, phi), -math.pi / 2)  # clamp phi to [-pi/2, pi/2]
+            previous_position = [x, y]
+        if event == cv2.EVENT_LBUTTONUP:  # end of the drag
+            should_rotate = False
+
+
+body_edges = np.array(
+    [[0, 1],  # neck - nose
+     [1, 16], [16, 18],  # nose - l_eye - l_ear
+     [1, 15], [15, 17],  # nose - r_eye - r_ear
+     [0, 3], [3, 4], [4, 5],     # neck - l_shoulder - l_elbow - l_wrist
+     [0, 9], [9, 10], [10, 11],  # neck - r_shoulder - r_elbow - r_wrist
+     [0, 6], [6, 7], [7, 8],        # neck - l_hip - l_knee - l_ankle
+     [0, 12], [12, 13], [13, 14]])  # neck - r_hip - r_knee - r_ankle
+
+
+def draw_poses(img, poses_2d):
+    for pose in poses_2d:
+        pose = np.array(pose[0:-1]).reshape((-1, 3)).transpose()  # drop the last value; rows: x, y, third per-keypoint value
+        was_found = pose[2] > 0  # keypoints whose third value is positive
+        for edge in body_edges:
+            if was_found[edge[0]] and was_found[edge[1]]:  # draw a limb only when both of its ends were found
+                cv2.line(img, tuple(pose[0:2, edge[0]].astype(np.int32)), tuple(pose[0:2, edge[1]].astype(np.int32)),
+                         (255, 255, 0), 4, cv2.LINE_AA)
+        for kpt_id in range(pose.shape[1]):
+            if pose[2, kpt_id] != -1:  # -1 in the third row presumably marks a missing keypoint - confirm in parse_poses
+                cv2.circle(img, tuple(pose[0:2, kpt_id].astype(np.int32)), 3, (0, 255, 255), -1, cv2.LINE_AA)
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/modules/inference_engine.py b/demos/python_demos/human_pose_estimation_3d_demo/modules/inference_engine.py
new file mode 100644
index 00000000000..cffad81ed40
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/modules/inference_engine.py
@@ -0,0 +1,53 @@
+#!/usr/bin/env python
+"""
+ Copyright (c) 2019 Intel Corporation
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+      http://www.apache.org/licenses/LICENSE-2.0
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import os
+
+import numpy as np
+
+from openvino.inference_engine import IENetwork, IECore
+
+
+class InferenceEngine:
+    def __init__(self, net_model_xml_path, device, stride):
+        self.device = device
+        self.stride = stride  # infer() crops inputs so both sides are multiples of this value
+
+        net_model_bin_path = os.path.splitext(net_model_xml_path)[0] + '.bin'  # same base name as the .xml
+        self.net = IENetwork(model=net_model_xml_path, weights=net_model_bin_path)
+        required_input_key = {'data'}  # the network must have exactly this one input
+        assert required_input_key == set(self.net.inputs.keys()), \
+            'Demo supports only topologies with the following input key: {}'.format(', '.join(required_input_key))
+        required_output_keys = {'features', 'heatmaps', 'pafs'}  # extra outputs are tolerated (subset check)
+        assert required_output_keys.issubset(self.net.outputs.keys()), \
+            'Demo supports only topologies with the following output keys: {}'.format(', '.join(required_output_keys))
+
+        self.ie = IECore()
+        self.exec_net = self.ie.load_network(network=self.net, num_requests=1, device_name=device)
+
+    def infer(self, img):
+        img = img[0:img.shape[0] - (img.shape[0] % self.stride),  # crop off the remainder rows/columns
+                  0:img.shape[1] - (img.shape[1] % self.stride)]
+        input_layer = next(iter(self.net.inputs))
+        n, c, h, w = self.net.inputs[input_layer].shape
+        if h != img.shape[0] or w != img.shape[1]:  # image size differs: reshape and reload the network
+            self.net.reshape({input_layer: (n, c, img.shape[0], img.shape[1])})
+            self.exec_net = self.ie.load_network(network=self.net, num_requests=1, device_name=self.device)
+        img = np.transpose(img, (2, 0, 1))[None, ]  # move axis 2 to the front and add a leading axis
+
+        inference_result = self.exec_net.infer(inputs={'data': img})
+
+        inference_result = (inference_result['features'][0],  # first item of each output, returned as a tuple
+                            inference_result['heatmaps'][0], inference_result['pafs'][0])
+        return inference_result
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/modules/input_reader.py b/demos/python_demos/human_pose_estimation_3d_demo/modules/input_reader.py
new file mode 100644
index 00000000000..98e38ab20cc
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/modules/input_reader.py
@@ -0,0 +1,73 @@
+#!/usr/bin/env python
+"""
+ Copyright (c) 2019 Intel Corporation
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+      http://www.apache.org/licenses/LICENSE-2.0
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import cv2
+
+
+class InputReader:
+    def __init__(self, file_names):
+        # an unreadable first entry means it is not an image: treat it as a video source
+        first_frame = cv2.imread(file_names[0], cv2.IMREAD_COLOR)
+        self.is_video = first_frame is None
+        if self.is_video:
+            self._input_reader = VideoReader(file_names[0])  # remaining entries are ignored
+        else:
+            self._input_reader = ImageReader(file_names)
+
+    def __iter__(self):
+        return iter(self._input_reader)
+
+    def __next__(self):
+        return next(self._input_reader)
+
+
+class ImageReader:
+    def __init__(self, file_names):
+        self.file_names = file_names  # image paths, read lazily one per __next__ call
+        self.max_idx = len(file_names)
+
+    def __iter__(self):
+        self.idx = 0  # restart from the first path on every new iteration
+        return self
+
+    def __next__(self):
+        if self.idx == self.max_idx:
+            raise StopIteration
+        img = cv2.imread(self.file_names[self.idx], cv2.IMREAD_COLOR)
+        if img is None or img.size == 0:  # cv2.imread returns None when the file cannot be read
+            raise IOError('Image {} cannot be read'.format(self.file_names[self.idx]))
+        self.idx += 1
+        return img
+
+
+class VideoReader:
+    def __init__(self, file_name):
+        try:  # OpenCV needs int to read from webcam
+            self.file_name = int(file_name)
+        except ValueError:  # not a number: keep the value as given (a path)
+            self.file_name = file_name
+
+    def __iter__(self):
+        self.cap = cv2.VideoCapture(self.file_name)  # a new capture is opened each time iteration starts
+        self.cap.set(cv2.CAP_PROP_FRAME_WIDTH, 1920)  # request 1920x1080 frames from the source
+        self.cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 1080)
+        if not self.cap.isOpened():
+            raise IOError('Video {} cannot be opened'.format(self.file_name))
+        return self
+
+    def __next__(self):
+        was_read, img = self.cap.read()
+        if not was_read:  # no frame was returned: end the iteration
+            raise StopIteration
+        return img
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/modules/one_euro_filter.py b/demos/python_demos/human_pose_estimation_3d_demo/modules/one_euro_filter.py
new file mode 100644
index 00000000000..156279bbea8
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/modules/one_euro_filter.py
@@ -0,0 +1,65 @@
+#!/usr/bin/env python
+"""
+ Copyright (c) 2019 Intel Corporation
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+      http://www.apache.org/licenses/LICENSE-2.0
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import math
+
+
+def get_alpha(rate=30, cutoff=1):
+    time_constant = 1 / (2 * math.pi * cutoff)  # tau: shrinks as the cutoff grows
+    sample_period = 1 / rate  # te
+    return 1 / (1 + time_constant / sample_period)  # lies in (0, 1) for positive rate and cutoff
+
+
+class LowPassFilter:
+    def __init__(self):
+        self.x_previous = None  # last output; None until the first sample arrives
+
+    def __call__(self, x, alpha=0.5):
+        if self.x_previous is not None:
+            # exponential smoothing: blend the new sample with the previous output
+            x = alpha * x + (1 - alpha) * self.x_previous
+        # the first sample passes through unchanged and seeds the filter state
+        self.x_previous = x
+        return x
+
+
+class OneEuroFilter:
+    def __init__(self, freq=15, mincutoff=1, beta=1, dcutoff=1):
+        # freq scales the per-sample difference into a rate of change;
+        # mincutoff and beta set the adaptive cutoff used for the signal,
+        # dcutoff is the fixed cutoff used to smooth the derivative.
+        self.freq, self.mincutoff, self.beta, self.dcutoff = freq, mincutoff, beta, dcutoff
+        self.filter_x, self.filter_dx = LowPassFilter(), LowPassFilter()
+        self.x_previous = self.dx = None  # both unset until the first sample
+
+    def __call__(self, x):
+        # no derivative can be formed for the very first sample, so use 0
+        self.dx = 0 if self.dx is None else (x - self.x_previous) * self.freq
+        derivative_alpha = get_alpha(self.freq, self.dcutoff)
+        dx_smoothed = self.filter_dx(self.dx, derivative_alpha)
+        # the faster the signal changes, the higher the cutoff (less smoothing)
+        cutoff = self.mincutoff + self.beta * abs(dx_smoothed)
+        signal_alpha = get_alpha(self.freq, cutoff)
+        x_filtered = self.filter_x(x, signal_alpha)
+        # keep the raw (unfiltered) sample for the next derivative estimate
+        self.x_previous = x
+        return x_filtered
+
+
+if __name__ == '__main__':
+    smoother = OneEuroFilter(freq=15, beta=0.1)
+    for step in range(10):
+        noisy = step + (-1)**(step % 2)  # ramp with an alternating +1 / -1 offset
+        print(smoother(noisy), noisy)
+    # each printed line is "<filtered value> <raw value>"
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/modules/parse_poses.py b/demos/python_demos/human_pose_estimation_3d_demo/modules/parse_poses.py
new file mode 100644
index 00000000000..dc16c238415
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/modules/parse_poses.py
@@ -0,0 +1,161 @@
+#!/usr/bin/env python
+"""
+ Copyright (c) 2019 Intel Corporation
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+      http://www.apache.org/licenses/LICENSE-2.0
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import numpy as np
+
+from modules.pose import Pose, propagate_ids
+from pose_extractor import extract_poses
+
+AVG_PERSON_HEIGHT = 180  # factor applied to the x, y, z values read from the network (presumably cm - confirm)
+
+# Slot in the 19-keypoint layout for each extracted keypoint id; pelvis (body center) is missing, id == 2
+map_id_to_panoptic = [1, 0, 9, 10, 11, 3, 4, 5, 12, 13, 14, 6, 7, 8, 15, 16, 17, 18]
+# Groups of keypoint ids (19-keypoint layout) whose 3D coordinates are refined together.
+limbs = [[18, 17, 1],
+         [16, 15, 1],
+         [5, 4, 3],
+         [8, 7, 6],
+         [11, 10, 9],
+         [14, 13, 12]]
+
+
+def get_root_relative_poses(inference_results):  # returns (poses_3d, poses_2d), one row per kept pose
+    features, heatmap, paf_map = inference_results
+    # features is read below as three consecutive channels per keypoint, indexed [channel, y, x].
+    upsample_ratio = 4
+    found_poses = extract_poses(heatmap[0:-1], paf_map, upsample_ratio)  # last heat-map channel is not passed on
+    # scale coordinates to features space
+    found_poses[:, 0:-1:3] /= upsample_ratio
+    found_poses[:, 1:-1:3] /= upsample_ratio
+    # Each found pose row is read as (x, y, conf) triplets followed by one trailing pose-level value.
+    poses_2d = []
+    num_kpt_panoptic = 19
+    num_kpt = 18
+    for pose_id in range(found_poses.shape[0]):
+        if found_poses[pose_id, 5] == -1:  # skip the pose if the neck was not found
+            continue
+        pose_2d = np.ones(num_kpt_panoptic * 3 + 1, dtype=np.float32) * -1  # +1 for pose confidence
+        for kpt_id in range(num_kpt):
+            if found_poses[pose_id, kpt_id * 3] != -1:
+                x_2d, y_2d, conf = found_poses[pose_id, kpt_id * 3:(kpt_id + 1) * 3]
+                pose_2d[map_id_to_panoptic[kpt_id] * 3] = x_2d  # just repacking
+                pose_2d[map_id_to_panoptic[kpt_id] * 3 + 1] = y_2d
+                pose_2d[map_id_to_panoptic[kpt_id] * 3 + 2] = conf
+        pose_2d[-1] = found_poses[pose_id, -1]
+        poses_2d.append(pose_2d)
+    poses_2d = np.array(poses_2d)
+    # poses_3d stores four values per keypoint: x, y, z and the 2D confidence; everything starts at -1.
+    keypoint_treshold = 0.1
+    poses_3d = np.ones((len(poses_2d), num_kpt_panoptic * 4), dtype=np.float32) * -1
+    for pose_id in range(poses_3d.shape[0]):
+        if poses_2d[pose_id, 2] <= keypoint_treshold:  # neck (slot 0) confidence too low: row keeps its -1 fill
+            continue
+        pose_3d = poses_3d[pose_id]  # view into poses_3d, so the writes below update it in place
+        neck_2d = poses_2d[pose_id, 0:2].astype(np.int32)  # truncated to integer map indices
+        # read all pose coordinates at neck location
+        for kpt_id in range(num_kpt_panoptic):
+            map_3d = features[kpt_id * 3:(kpt_id + 1) * 3]
+            pose_3d[kpt_id * 4] = map_3d[0, neck_2d[1], neck_2d[0]]
+            pose_3d[kpt_id * 4 + 1] = map_3d[1, neck_2d[1], neck_2d[0]]
+            pose_3d[kpt_id * 4 + 2] = map_3d[2, neck_2d[1], neck_2d[0]]
+            pose_3d[kpt_id * 4 + 3] = poses_2d[pose_id, kpt_id * 3 + 2]
+
+        # refine keypoints coordinates at corresponding limbs locations
+        for limb in limbs:
+            for kpt_id_from in limb:
+                if poses_2d[pose_id, kpt_id_from * 3 + 2] <= keypoint_treshold:
+                    continue
+                for kpt_id_where in limb:
+                    kpt_from_2d = poses_2d[pose_id, kpt_id_from * 3:kpt_id_from * 3 + 2].astype(np.int32)
+                    map_3d = features[kpt_id_where * 3:(kpt_id_where + 1) * 3]
+                    pose_3d[kpt_id_where * 4] = map_3d[0, kpt_from_2d[1], kpt_from_2d[0]]
+                    pose_3d[kpt_id_where * 4 + 1] = map_3d[1, kpt_from_2d[1], kpt_from_2d[0]]
+                    pose_3d[kpt_id_where * 4 + 2] = map_3d[2, kpt_from_2d[1], kpt_from_2d[0]]
+                break  # only the first sufficiently confident keypoint of the limb is used as the read location
+    # Scale x, y, z of every keypoint (rows skipped above included); the confidence values are left untouched.
+    poses_3d[:, 0::4] *= AVG_PERSON_HEIGHT
+    poses_3d[:, 1::4] *= AVG_PERSON_HEIGHT
+    poses_3d[:, 2::4] *= AVG_PERSON_HEIGHT
+    return poses_3d, poses_2d
+
+
+previous_poses_2d = []  # Pose objects of the previous frame; parse_poses rebinds it when is_video is set
+
+
+def parse_poses(inference_results, input_scale, stride, fx, is_video=False):  # returns (translated 3D poses, scaled 2D poses)
+    global previous_poses_2d  # rebound below when is_video is set
+    features = inference_results[0]
+    poses_3d, poses_2d = get_root_relative_poses(inference_results)
+    poses_2d_scaled = []
+    for pose_2d in poses_2d:
+        num_kpt = (pose_2d.shape[0] - 1) // 3  # the last element is the pose confidence, not a keypoint
+        pose_2d_scaled = np.ones(pose_2d.shape[0], dtype=np.float32) * -1
+        for kpt_id in range(num_kpt):
+            if pose_2d[kpt_id * 3] != -1:
+                pose_2d_scaled[kpt_id * 3] = pose_2d[kpt_id * 3] * stride / input_scale
+                pose_2d_scaled[kpt_id * 3 + 1] = pose_2d[kpt_id * 3 + 1] * stride / input_scale
+                pose_2d_scaled[kpt_id * 3 + 2] = pose_2d[kpt_id * 3 + 2]
+        pose_2d_scaled[-1] = pose_2d[-1]
+        poses_2d_scaled.append(pose_2d_scaled)
+
+    if is_video:  # track poses ids
+        current_poses_2d = []
+        for pose_2d_scaled in poses_2d_scaled:
+            pose_keypoints = np.ones((Pose.num_kpts, 2), dtype=np.int32) * -1
+            for kpt_id in range(Pose.num_kpts):  # only the first Pose.num_kpts keypoint slots are used for tracking
+                if pose_2d_scaled[kpt_id * 3] != -1.0:  # keypoint was found
+                    pose_keypoints[kpt_id, 0:2] = pose_2d_scaled[kpt_id * 3:kpt_id * 3 + 2].astype(np.int32)
+            pose = Pose(pose_keypoints, pose_2d_scaled[-1])
+            current_poses_2d.append(pose)
+        propagate_ids(previous_poses_2d, current_poses_2d)
+        previous_poses_2d = current_poses_2d
+
+    translated_poses_3d = []
+    # translate poses
+    for pose_id in range(poses_3d.shape[0]):
+        pose_3d = poses_3d[pose_id].reshape((-1, 4)).transpose()  # rows: x, y, z, confidence
+        pose_2d = poses_2d[pose_id][0:-1].reshape((-1, 3)).transpose()  # rows: x, y, confidence
+        num_valid = np.count_nonzero(pose_2d[2] != -1)
+        pose_3d_valid = np.zeros((3, num_valid), dtype=np.float32)
+        pose_2d_valid = np.zeros((2, num_valid), dtype=np.float32)
+        valid_id = 0
+        for kpt_id in range(pose_3d.shape[1]):
+            if pose_2d[2, kpt_id] == -1:
+                continue
+            pose_3d_valid[:, valid_id] = pose_3d[0:3, kpt_id]
+            pose_2d_valid[:, valid_id] = pose_2d[0:2, kpt_id]
+            valid_id += 1
+        # Express the 2D coordinates relative to the centre of the feature map.
+        pose_2d_valid[0] = pose_2d_valid[0] - features.shape[2]/2
+        pose_2d_valid[1] = pose_2d_valid[1] - features.shape[1]/2
+        mean_3d = np.expand_dims(pose_3d_valid.mean(axis=1), axis=1)
+        mean_2d = np.expand_dims(pose_2d_valid.mean(axis=1), axis=1)
+        numerator = np.trace(np.dot((pose_3d_valid[0:2] - mean_3d[0:2]).transpose(),
+                                    pose_3d_valid[0:2] - mean_3d[0:2])).sum()
+        numerator = np.sqrt(numerator)  # spread of the 3D x/y coordinates around their mean
+        denominator = np.sqrt(np.trace(np.dot((pose_2d_valid[0:2] - mean_2d[0:2]).transpose(),
+                                              pose_2d_valid[0:2] - mean_2d[0:2])).sum())
+        mean_2d = np.array([mean_2d[0, 0], mean_2d[1, 0], fx * input_scale / stride])
+        mean_3d = np.array([mean_3d[0, 0], mean_3d[1, 0], 0])
+        translation = numerator / denominator * mean_2d - mean_3d
+        # NOTE(review): denominator is 0 when all valid 2D keypoints coincide - confirm this cannot happen.
+        if is_video:
+            translation = current_poses_2d[pose_id].filter(translation)  # smooth with the pose's own filters
+        for kpt_id in range(19):
+            pose_3d[0, kpt_id] = pose_3d[0, kpt_id] + translation[0]
+            pose_3d[1, kpt_id] = pose_3d[1, kpt_id] + translation[1]
+            pose_3d[2, kpt_id] = pose_3d[2, kpt_id] + translation[2]
+        translated_poses_3d.append(pose_3d.transpose().reshape(-1))
+
+    return np.array(translated_poses_3d), np.array(poses_2d_scaled)
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/modules/pose.py b/demos/python_demos/human_pose_estimation_3d_demo/modules/pose.py
new file mode 100644
index 00000000000..c98850199b1
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/modules/pose.py
@@ -0,0 +1,107 @@
+#!/usr/bin/env python
+"""
+ Copyright (c) 2019 Intel Corporation
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+      http://www.apache.org/licenses/LICENSE-2.0
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import cv2
+import numpy as np
+
+from modules.one_euro_filter import OneEuroFilter
+
+
+class Pose:
+    num_kpts = 18
+    kpt_names = ['neck', 'nose',
+                 'l_sho', 'l_elb', 'l_wri', 'l_hip', 'l_knee', 'l_ank',
+                 'r_sho', 'r_elb', 'r_wri', 'r_hip', 'r_knee', 'r_ank',
+                 'r_eye', 'l_eye',
+                 'r_ear', 'l_ear']
+    sigmas = np.array([.79, .26, .79, .72, .62, 1.07, .87, .89, .79, .72, .62, 1.07, .87, .89, .25, .25, .35, .35],
+                      dtype=np.float32) / 10.0
+    vars = (sigmas * 2) ** 2
+    last_id = -1
+    color = [0, 224, 255]
+
+    def __init__(self, keypoints, confidence):
+        super().__init__()
+        self.keypoints = keypoints
+        self.confidence = confidence
+        found_keypoints = np.zeros((np.count_nonzero(keypoints[:, 0] != -1), 2), dtype=np.int32)
+        found_kpt_id = 0
+        for kpt_id in range(keypoints.shape[0]):
+            if keypoints[kpt_id, 0] == -1:
+                continue
+            found_keypoints[found_kpt_id] = keypoints[kpt_id]
+            found_kpt_id += 1
+        self.bbox = cv2.boundingRect(found_keypoints)
+        self.id = None
+        self.translation_filter = [OneEuroFilter(freq=80, beta=0.01),
+                                   OneEuroFilter(freq=80, beta=0.01),
+                                   OneEuroFilter(freq=80, beta=0.01)]
+
+    def update_id(self, id=None):
+        self.id = id
+        if self.id is None:
+            self.id = Pose.last_id + 1
+            Pose.last_id += 1
+
+    def filter(self, translation):
+        filtered_translation = []
+        for coordinate_id in range(3):
+            filtered_translation.append(self.translation_filter[coordinate_id](translation[coordinate_id]))
+        return filtered_translation
+
+
+def get_similarity(a, b, threshold=0.5):
+    num_similar_kpt = 0
+    for kpt_id in range(Pose.num_kpts):
+        if a.keypoints[kpt_id, 0] != -1 and b.keypoints[kpt_id, 0] != -1:
+            distance = np.sum((a.keypoints[kpt_id] - b.keypoints[kpt_id]) ** 2)
+            area = max(a.bbox[2] * a.bbox[3], b.bbox[2] * b.bbox[3])
+            similarity = np.exp(-distance / (2 * (area + np.spacing(1)) * Pose.vars[kpt_id]))
+            if similarity > threshold:
+                num_similar_kpt += 1
+    return num_similar_kpt
+
+
+def propagate_ids(previous_poses, current_poses, threshold=3):
+    """Propagate poses ids from previous frame results. Id is propagated,
+    if there are at least `threshold` similar keypoints between pose from previous frame and current.
+
+    :param previous_poses: poses from previous frame with ids
+    :param current_poses: poses from current frame to assign ids
+    :param threshold: minimal number of similar keypoints between poses
+    :return: None
+    """
+    current_poses_sorted_ids = list(range(len(current_poses)))
+    current_poses_sorted_ids = sorted(
+        current_poses_sorted_ids, key=lambda pose_id: current_poses[pose_id].confidence, reverse=True)  # match confident poses first
+    mask = np.ones(len(previous_poses), dtype=np.int32)
+    for current_pose_id in current_poses_sorted_ids:
+        best_matched_id = None
+        best_matched_pose_id = None
+        best_matched_iou = 0
+        for previous_pose_id in range(len(previous_poses)):
+            if not mask[previous_pose_id]:
+                continue
+            iou = get_similarity(current_poses[current_pose_id], previous_poses[previous_pose_id])
+            if iou > best_matched_iou:
+                best_matched_iou = iou
+                best_matched_pose_id = previous_poses[previous_pose_id].id
+                best_matched_id = previous_pose_id
+        if best_matched_iou >= threshold:
+            mask[best_matched_id] = 0
+        else:  # pose not similar to any previous
+            best_matched_pose_id = None
+        current_poses[current_pose_id].update_id(best_matched_pose_id)
+        if best_matched_pose_id is not None:
+            current_poses[current_pose_id].translation_filter = previous_poses[best_matched_id].translation_filter
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/CMakeLists.txt b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/CMakeLists.txt
new file mode 100644
index 00000000000..781b5f1d58b
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/CMakeLists.txt
@@ -0,0 +1,27 @@
+# Copyright (C) 2018-2019 Intel Corporation
+# SPDX-License-Identifier: Apache-2.0
+#
+
+execute_process(
+    COMMAND "${PYTHON_EXECUTABLE}" -c "import numpy; print(numpy.get_include())"
+    OUTPUT_VARIABLE NUMPY_INCLUDE_DIR
+    OUTPUT_STRIP_TRAILING_WHITESPACE
+    RESULT_VARIABLE NUMPY_NOT_FOUND)  # runs Python to print NumPy's header directory; the exit status lands in NUMPY_NOT_FOUND
+if(NUMPY_NOT_FOUND)
+    message(FATAL_ERROR "NumPy headers not found")
+endif()
+# OpenCV 4 is required; configuration stops when it cannot be found.
+find_package(OpenCV 4 REQUIRED)
+# MODULE library: built to be loaded at runtime rather than linked into other targets.
+set(target_name pose_extractor)
+add_library(${target_name} MODULE wrapper.cpp
+                                  src/extract_poses.hpp src/extract_poses.cpp
+                                  src/human_pose.hpp src/human_pose.cpp
+                                  src/peak.hpp src/peak.cpp)
+target_include_directories(${target_name} PRIVATE src/ ${PYTHON_INCLUDE_DIRS} ${NUMPY_INCLUDE_DIR} ${OpenCV_INCLUDE_DIRS})
+target_link_libraries(${target_name} ${PYTHON_LIBRARIES} ${OpenCV_LIBS})
+set_target_properties(${target_name} PROPERTIES PREFIX "" OUTPUT_NAME "${target_name}")  # no default library prefix in the file name
+if(WIN32)
+    set_target_properties(${target_name} PROPERTIES SUFFIX ".pyd")  # file suffix given to the module on Windows
+endif()
+
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/extract_poses.cpp b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/extract_poses.cpp
new file mode 100644
index 00000000000..cfa871d22f8
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/extract_poses.cpp
@@ -0,0 +1,66 @@
+// Copyright (C) 2018-2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#include <opencv2/imgproc/imgproc.hpp>
+
+#include "extract_poses.hpp"
+#include "peak.hpp"
+
+namespace human_pose_estimation {
+static void resizeFeatureMaps(std::vector<cv::Mat>& featureMaps, int upsampleRatio) {
+    // Enlarge every map in place by the same factor along x and y, using bicubic interpolation.
+    for (cv::Mat& map : featureMaps) {
+        cv::resize(map, map, cv::Size(), upsampleRatio, upsampleRatio, cv::INTER_CUBIC);
+    }
+}
+
+// Parallel loop body that runs findPeaks for every heat map index of the range it is given.
+class FindPeaksBody: public cv::ParallelLoopBody {
+public:
+    FindPeaksBody(const std::vector<cv::Mat>& heatMaps, float minPeaksDistance,
+                  std::vector<std::vector<Peak> >& peaksFromHeatMap)
+        : heatMaps(heatMaps), minPeaksDistance(minPeaksDistance), peaksFromHeatMap(peaksFromHeatMap) {}
+
+    // Processes the indices range.start .. range.end - 1.
+    virtual void operator()(const cv::Range& range) const {
+        for (int heatMapId = range.start; heatMapId < range.end; ++heatMapId) {
+            findPeaks(heatMaps, minPeaksDistance, peaksFromHeatMap, heatMapId);
+        }
+    }
+
+private:
+    const std::vector<cv::Mat>& heatMaps;
+    float minPeaksDistance;
+    std::vector<std::vector<Peak> >& peaksFromHeatMap;
+};
+
+std::vector<HumanPose> extractPoses(
+        std::vector<cv::Mat>& heatMaps,
+        std::vector<cv::Mat>& pafs,
+        int upsampleRatio) {
+    // Both map sets are upsampled in place, so the caller's matrices are modified.
+    resizeFeatureMaps(heatMaps, upsampleRatio);
+    resizeFeatureMaps(pafs, upsampleRatio);
+    // Detect peaks in every heat map in parallel; at this point peak ids are local to each map.
+    const float minPeaksDistance = 3.0f;
+    std::vector<std::vector<Peak> > peaksFromHeatMap(heatMaps.size());
+    FindPeaksBody findPeaksBody(heatMaps, minPeaksDistance, peaksFromHeatMap);
+    cv::parallel_for_(cv::Range(0, static_cast<int>(heatMaps.size())), findPeaksBody);
+    // Shift the ids by the number of peaks in all preceding maps so they are unique across maps.
+    int idOffset = 0;
+    for (size_t heatmapId = 1; heatmapId < heatMaps.size(); heatmapId++) {
+        idOffset += static_cast<int>(peaksFromHeatMap[heatmapId - 1].size());
+        for (Peak& peak : peaksFromHeatMap[heatmapId]) {
+            peak.id += idOffset;
+        }
+    }
+    const int keypointsNumber = 18;
+    const float midPointsScoreThreshold = 0.05f;
+    const float foundMidPointsRatioThreshold = 0.8f;
+    const int minJointsNumber = 3;
+    const float minSubsetScore = 0.2f;
+    return groupPeaksToPoses(peaksFromHeatMap, pafs, keypointsNumber, midPointsScoreThreshold,
+                             foundMidPointsRatioThreshold, minJointsNumber, minSubsetScore);
+}
+} // namespace human_pose_estimation
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/extract_poses.hpp b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/extract_poses.hpp
new file mode 100644
index 00000000000..e9658656c73
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/extract_poses.hpp
@@ -0,0 +1,16 @@
+// Copyright (C) 2018-2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#include <vector>
+
+#include <opencv2/core/core.hpp>
+
+#include "human_pose.hpp"
+
+namespace human_pose_estimation {
+std::vector<HumanPose> extractPoses(  // upsamples both map sets in place, then groups heat-map peaks into poses
+        std::vector<cv::Mat>& heatMaps,  // keypoint heat maps; resized in place
+        std::vector<cv::Mat>& pafs,  // part-affinity maps; resized in place
+        int upsampleRatio);  // scale factor applied to both map sets before peak search
+} // namespace human_pose_estimation
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/human_pose.cpp b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/human_pose.cpp
new file mode 100644
index 00000000000..05c7e92989c
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/human_pose.cpp
@@ -0,0 +1,15 @@
+// Copyright (C) 2018-2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#include <vector>
+
+#include "human_pose.hpp"
+
+namespace human_pose_estimation {
+// Copies the given keypoints and score into the new pose.
+HumanPose::HumanPose(const std::vector<cv::Point3f>& keypoints, const float& score)
+    : keypoints(keypoints), score(score) {
+}
+} // namespace human_pose_estimation
+
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/human_pose.hpp b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/human_pose.hpp
new file mode 100644
index 00000000000..75abc562096
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/human_pose.hpp
@@ -0,0 +1,20 @@
+// Copyright (C) 2018-2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#pragma once
+
+#include <vector>
+
+#include <opencv2/core/core.hpp>
+
+namespace human_pose_estimation {
+struct HumanPose {  // result record for one assembled pose
+    HumanPose(const std::vector<cv::Point3f>& keypoints = std::vector<cv::Point3f>(),
+              const float& score = 0);
+
+    std::vector<cv::Point3f> keypoints;  // as filled by groupPeaksToPoses: x, y and peak score in z; all -1 when absent
+    float score;  // pose-level score supplied at construction
+};
+} // namespace human_pose_estimation
+
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/peak.cpp b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/peak.cpp
new file mode 100644
index 00000000000..757af16fc8d
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/peak.cpp
@@ -0,0 +1,327 @@
+// Copyright (C) 2018-2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#include <algorithm>
+#include <utility>
+#include <vector>
+
+#include "peak.hpp"
+
+namespace human_pose_estimation {
+// Builds a peak from its identifier, position and score.
+Peak::Peak(const int id, const cv::Point2f& pos, const float score)
+    : id(id), pos(pos), score(score) {
+}
+
+// Starts an empty pose: every keypoint slot holds -1 (no peak), no joints, zero score.
+HumanPoseByPeaksIndices::HumanPoseByPeaksIndices(const int keypointsNumber)
+    : peaksIndices(keypointsNumber, -1), nJoints(0), score(0.0f) {
+}
+
+// Records a scored link between two joints, each referred to by an index.
+TwoJointsConnection::TwoJointsConnection(const int firstJointIdx,
+                                         const int secondJointIdx,
+                                         const float score)
+    : firstJointIdx(firstJointIdx), secondJointIdx(secondJointIdx), score(score) {
+}
+
+void findPeaks(const std::vector<cv::Mat>& heatMaps,
+               const float minPeaksDistance,
+               std::vector<std::vector<Peak> >& allPeaks,
+               int heatMapId) {  // appends the peaks of heatMaps[heatMapId] to allPeaks[heatMapId]
+    const float threshold = 0.1f;  // values below this are treated as 0
+    std::vector<cv::Point> peaks;
+    const cv::Mat& heatMap = heatMaps[heatMapId];
+    const float* heatMapData = heatMap.ptr<float>();
+    size_t heatMapStep = heatMap.step1();
+    for (int y = -1; y < heatMap.rows + 1; y++) {  // the scan includes a one-pixel border outside the map
+        for (int x = -1; x < heatMap.cols + 1; x++) {
+            float val = 0;  // positions outside the map count as 0
+            if (x >= 0
+                    && y >= 0
+                    && x < heatMap.cols
+                    && y < heatMap.rows) {
+                val = heatMapData[y * heatMapStep + x];
+                val = val >= threshold ? val : 0;
+            }
+            // The four neighbours follow; note that left_val reads x + 1 and right_val reads x - 1.
+            float left_val = 0;
+            if (y >= 0
+                    && x < (heatMap.cols - 1)
+                    && y < heatMap.rows) {
+                left_val = heatMapData[y * heatMapStep + x + 1];
+                left_val = left_val >= threshold ? left_val : 0;
+            }
+
+            float right_val = 0;
+            if (x > 0
+                    && y >= 0
+                    && y < heatMap.rows) {
+                right_val = heatMapData[y * heatMapStep + x - 1];
+                right_val = right_val >= threshold ? right_val : 0;
+            }
+
+            float top_val = 0;
+            if (x >= 0
+                    && x < heatMap.cols
+                    && y < (heatMap.rows - 1)) {
+                top_val = heatMapData[(y + 1) * heatMapStep + x];
+                top_val = top_val >= threshold ? top_val : 0;
+            }
+
+            float bottom_val = 0;
+            if (x >= 0
+                    && y > 0
+                    && x < heatMap.cols) {
+                bottom_val = heatMapData[(y - 1) * heatMapStep + x];
+                bottom_val = bottom_val >= threshold ? bottom_val : 0;
+            }
+            // A peak must be strictly greater than all four thresholded neighbours.
+            if ((val > left_val)
+                    && (val > right_val)
+                    && (val > top_val)
+                    && (val > bottom_val)) {
+                peaks.push_back(cv::Point(x, y));
+            }
+        }
+    }
+    std::sort(peaks.begin(), peaks.end(), [](const cv::Point& a, const cv::Point& b) {
+        return a.x < b.x;
+    });
+    std::vector<bool> isActualPeak(peaks.size(), true);
+    int peakCounter = 0;  // ids assigned here start at 0 for every heat map
+    std::vector<Peak>& peaksWithScoreAndID = allPeaks[heatMapId];
+    for (size_t i = 0; i < peaks.size(); i++) {
+        if (isActualPeak[i]) {
+            for (size_t j = i + 1; j < peaks.size(); j++) {  // drop later peaks closer than minPeaksDistance to a kept one
+                if (sqrt((peaks[i].x - peaks[j].x) * (peaks[i].x - peaks[j].x) +
+                         (peaks[i].y - peaks[j].y) * (peaks[i].y - peaks[j].y)) < minPeaksDistance) {
+                    isActualPeak[j] = false;
+                }
+            }
+            peaksWithScoreAndID.push_back(Peak(peakCounter++, peaks[i], heatMap.at<float>(peaks[i])));
+        }
+    }
+}
+
+std::vector<HumanPose> groupPeaksToPoses(const std::vector<std::vector<Peak> >& allPeaks,  // peaks per heat map
+                                         const std::vector<cv::Mat>& pafs,  // part-affinity maps, two channels per limb
+                                         const size_t keypointsNumber,  // keypoint slots per pose
+                                         const float midPointsScoreThreshold,  // minimal alignment score of a sampled point
+                                         const float foundMidPointsRatioThreshold,  // minimal share of sampled points passing
+                                         const int minJointsNumber,  // poses with fewer joints are dropped
+                                         const float minSubsetScore) {  // minimal average score per joint of a kept pose
+    static const std::pair<int, int> limbIdsHeatmap[] = {  // 1-based heat-map ids of the two joints of each limb
+        {2, 3}, {2, 6}, {3, 4}, {4, 5}, {6, 7}, {7, 8}, {2, 9}, {9, 10}, {10, 11}, {2, 12}, {12, 13}, {13, 14},
+        {2, 1}, {1, 15}, {15, 17}, {1, 16}, {16, 18}, {3, 17}, {6, 18}
+    };
+    static const std::pair<int, int> limbIdsPaf[] = {  // PAF channel pair of each limb, offset by keypointsNumber + 1
+        {31, 32}, {39, 40}, {33, 34}, {35, 36}, {41, 42}, {43, 44}, {19, 20}, {21, 22}, {23, 24}, {25, 26},
+        {27, 28}, {29, 30}, {47, 48}, {49, 50}, {53, 54}, {51, 52}, {55, 56}, {37, 38}, {45, 46}
+    };
+    // Flattened list of all peaks; the code below indexes it by peak id, so ids must equal positions in it.
+    std::vector<Peak> candidates;
+    for (const auto& peaks : allPeaks) {
+         candidates.insert(candidates.end(), peaks.begin(), peaks.end());
+    }
+    std::vector<HumanPoseByPeaksIndices> subset(0, HumanPoseByPeaksIndices(static_cast<int>(keypointsNumber)));
+    for (size_t k = 0; k < sizeof(limbIdsPaf) / sizeof(*limbIdsPaf); k++) {
+        std::vector<TwoJointsConnection> connections;
+        const int mapIdxOffset = static_cast<int>(keypointsNumber) + 1;
+        std::pair<cv::Mat, cv::Mat> scoreMid = { pafs[limbIdsPaf[k].first - mapIdxOffset],
+                                                 pafs[limbIdsPaf[k].second - mapIdxOffset] };
+        const int idxJointA = limbIdsHeatmap[k].first - 1;
+        const int idxJointB = limbIdsHeatmap[k].second - 1;
+        const std::vector<Peak>& candA = allPeaks[idxJointA];
+        const std::vector<Peak>& candB = allPeaks[idxJointB];
+        const size_t nJointsA = candA.size();
+        const size_t nJointsB = candB.size();
+        if (nJointsA == 0
+                && nJointsB == 0) {
+            continue;
+        } else if (nJointsA == 0) {  // only B peaks exist: start a one-joint pose for each B peak not yet used
+            for (size_t i = 0; i < nJointsB; i++) {
+                int num = 0;
+                for (size_t j = 0; j < subset.size(); j++) {
+                    if (subset[j].peaksIndices[idxJointB] == candB[i].id) {
+                        num++;
+                        continue;
+                    }
+                }
+                if (num == 0) {
+                    HumanPoseByPeaksIndices personKeypoints(static_cast<int>(keypointsNumber));
+                    personKeypoints.peaksIndices[idxJointB] = candB[i].id;
+                    personKeypoints.nJoints = 1;
+                    personKeypoints.score = candB[i].score;
+                    subset.push_back(personKeypoints);
+                }
+            }
+            continue;
+        } else if (nJointsB == 0) {  // only A peaks exist: same handling for joint A
+            for (size_t i = 0; i < nJointsA; i++) {
+                int num = 0;
+                for (size_t j = 0; j < subset.size(); j++) {
+                    if (subset[j].peaksIndices[idxJointA] == candA[i].id) {
+                        num++;
+                        continue;
+                    }
+                }
+                if (num == 0) {
+                    HumanPoseByPeaksIndices personKeypoints(static_cast<int>(keypointsNumber));
+                    personKeypoints.peaksIndices[idxJointA] = candA[i].id;
+                    personKeypoints.nJoints = 1;
+                    personKeypoints.score = candA[i].score;
+                    subset.push_back(personKeypoints);
+                }
+            }
+            continue;
+        }
+        // Score every A-B pair by how well the PAF vectors sampled along the segment align with it.
+        std::vector<TwoJointsConnection> tempJointConnections;
+        for (size_t i = 0; i < nJointsA; i++) {
+            for (size_t j = 0; j < nJointsB; j++) {
+                cv::Point2f pt = candA[i].pos * 0.5 + candB[j].pos * 0.5;
+                cv::Point mid = cv::Point(cvRound(pt.x), cvRound(pt.y));
+                cv::Point2f vec = candB[j].pos - candA[i].pos;
+                double norm_vec = cv::norm(vec);
+                if (norm_vec == 0) {
+                    continue;
+                }
+                vec /= norm_vec;
+                float score = vec.x * scoreMid.first.at<float>(mid) + vec.y * scoreMid.second.at<float>(mid);
+                int height_n  = pafs[0].rows / 2;
+                float suc_ratio = 0.0f;
+                float mid_score = 0.0f;
+                const int mid_num = 10;  // number of points sampled between the two peaks
+                const float scoreThreshold = -100.0f;
+                if (score > scoreThreshold) {
+                    float p_sum = 0;
+                    int p_count = 0;
+                    cv::Size2f step((candB[j].pos.x - candA[i].pos.x)/(mid_num - 1),
+                                    (candB[j].pos.y - candA[i].pos.y)/(mid_num - 1));
+                    for (int n = 0; n < mid_num; n++) {
+                        cv::Point midPoint(cvRound(candA[i].pos.x + n * step.width),
+                                           cvRound(candA[i].pos.y + n * step.height));
+                        cv::Point2f pred(scoreMid.first.at<float>(midPoint),
+                                         scoreMid.second.at<float>(midPoint));
+                        score = vec.x * pred.x + vec.y * pred.y;
+                        if (score > midPointsScoreThreshold) {
+                            p_sum += score;
+                            p_count++;
+                        }
+                    }
+                    suc_ratio = static_cast<float>(p_count) / mid_num;  // cast first: int / int would truncate to 0 or 1
+                    float ratio = p_count > 0 ? p_sum / p_count : 0.0f;
+                    mid_score = ratio + static_cast<float>(std::min(height_n / norm_vec - 1, 0.0));  // penalty for long limbs
+                }
+                if (mid_score > 0
+                        && suc_ratio > foundMidPointsRatioThreshold) {
+                    tempJointConnections.push_back(TwoJointsConnection(static_cast<int>(i), static_cast<int>(j), mid_score));
+                }
+            }
+        }
+        if (!tempJointConnections.empty()) {  // best-scoring candidates first
+            std::sort(tempJointConnections.begin(), tempJointConnections.end(),
+                      [](const TwoJointsConnection& a,
+                         const TwoJointsConnection& b) {
+                return (a.score > b.score);
+            });
+        }
+        size_t num_limbs = std::min(nJointsA, nJointsB);
+        size_t cnt = 0;
+        std::vector<int> occurA(nJointsA, 0);
+        std::vector<int> occurB(nJointsB, 0);
+        for (size_t row = 0; row < tempJointConnections.size(); row++) {  // greedy pick: each peak joins one connection at most
+            if (cnt == num_limbs) {
+                break;
+            }
+            const int& indexA = tempJointConnections[row].firstJointIdx;
+            const int& indexB = tempJointConnections[row].secondJointIdx;
+            const float& score = tempJointConnections[row].score;
+            if (occurA[indexA] == 0
+                    && occurB[indexB] == 0) {
+                connections.push_back(TwoJointsConnection(candA[indexA].id, candB[indexB].id, score));
+                cnt++;
+                occurA[indexA] = 1;
+                occurB[indexB] = 1;
+            }
+        }
+        if (connections.empty()) {
+            continue;
+        }
+        // From here on the connection indices are peak ids, not positions inside candA / candB.
+        bool extraJointConnections = (k == 17 || k == 18);
+        if (k == 0) {  // first limb: every connection starts a new pose
+            subset = std::vector<HumanPoseByPeaksIndices>(
+                        connections.size(), HumanPoseByPeaksIndices(static_cast<int>(keypointsNumber)));
+            for (size_t i = 0; i < connections.size(); i++) {
+                const int& indexA = connections[i].firstJointIdx;
+                const int& indexB = connections[i].secondJointIdx;
+                subset[i].peaksIndices[idxJointA] = indexA;
+                subset[i].peaksIndices[idxJointB] = indexB;
+                subset[i].nJoints = 2;
+                subset[i].score = candidates[indexA].score + candidates[indexB].score + connections[i].score;
+            }
+        } else if (extraJointConnections) {  // last two limbs only fill empty slots; joint count and score stay unchanged
+            for (size_t i = 0; i < connections.size(); i++) {
+                const int& indexA = connections[i].firstJointIdx;
+                const int& indexB = connections[i].secondJointIdx;
+                for (size_t j = 0; j < subset.size(); j++) {
+                    if (subset[j].peaksIndices[idxJointA] == indexA
+                            && subset[j].peaksIndices[idxJointB] == -1) {
+                        subset[j].peaksIndices[idxJointB] = indexB;
+                    } else if (subset[j].peaksIndices[idxJointB] == indexB
+                                && subset[j].peaksIndices[idxJointA] == -1) {
+                        subset[j].peaksIndices[idxJointA] = indexA;
+                    }
+                }
+            }
+            continue;
+        } else {  // other limbs: extend the poses that already own joint A, otherwise start a new pose
+            for (size_t i = 0; i < connections.size(); i++) {
+                const int& indexA = connections[i].firstJointIdx;
+                const int& indexB = connections[i].secondJointIdx;
+                bool num = false;
+                for (size_t j = 0; j < subset.size(); j++) {
+                    if (subset[j].peaksIndices[idxJointA] == indexA) {
+                        subset[j].peaksIndices[idxJointB] = indexB;
+                        subset[j].nJoints++;
+                        subset[j].score += candidates[indexB].score + connections[i].score;
+                        num = true;
+                    }
+                }
+                if (!num) {
+                    HumanPoseByPeaksIndices hpWithScore(static_cast<int>(keypointsNumber));
+                    hpWithScore.peaksIndices[idxJointA] = indexA;
+                    hpWithScore.peaksIndices[idxJointB] = indexB;
+                    hpWithScore.nJoints = 2;
+                    hpWithScore.score = candidates[indexA].score + candidates[indexB].score + connections[i].score;
+                    subset.push_back(hpWithScore);
+                }
+            }
+        }
+    }
+    std::vector<HumanPose> poses;
+    for (const auto& subsetI : subset) {
+        if (subsetI.nJoints < minJointsNumber
+                || subsetI.score / subsetI.nJoints < minSubsetScore) {
+            continue;
+        }
+        int position = -1;
+        HumanPose pose(std::vector<cv::Point3f>(keypointsNumber, cv::Point3f(-1.0f, -1.0f, -1.0f)),
+                       subsetI.score * std::max(0, subsetI.nJoints - 1));
+        for (const auto& peakIdx : subsetI.peaksIndices) {
+            position++;
+            if (peakIdx >= 0) {  // slots without a peak keep (-1, -1, -1)
+                pose.keypoints[position].x = candidates[peakIdx].pos.x + 0.5f;
+                pose.keypoints[position].y = candidates[peakIdx].pos.y + 0.5f;
+                pose.keypoints[position].z = candidates[peakIdx].score;
+            }
+        }
+        poses.push_back(pose);
+    }
+    return poses;
+}
+} // namespace human_pose_estimation
+
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/peak.hpp b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/peak.hpp
new file mode 100644
index 00000000000..823153bee9c
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/src/peak.hpp
@@ -0,0 +1,56 @@
+// Copyright (C) 2018-2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#pragma once
+
+#include <vector>
+
+#include <opencv2/core/core.hpp>
+
+#include "human_pose.hpp"
+
+namespace human_pose_estimation {
+struct Peak {  // one detected peak: identifier, 2-D position and score
+    Peak(const int id = -1,
+         const cv::Point2f& pos = cv::Point2f(),
+         const float score = 0.0f);
+
+    int id;  // defaults to -1
+    cv::Point2f pos;  // defaults to (0, 0)
+    float score;  // defaults to 0
+};
+
+struct HumanPoseByPeaksIndices {  // a pose under construction, stored as indices of peaks rather than coordinates
+    explicit HumanPoseByPeaksIndices(const int keypointsNumber);
+
+    std::vector<int> peaksIndices;  // indexed by joint; groupPeaksToPoses only dereferences entries that are >= 0
+    int nJoints;  // number of joints attached so far
+    float score;  // running sum of the attached peaks' scores and connection scores
+};
+
+struct TwoJointsConnection {  // a scored link between two joints
+    TwoJointsConnection(const int firstJointIdx,
+                        const int secondJointIdx,
+                        const float score);
+
+    int firstJointIdx;  // presumably an index into the candidate peak list - TODO confirm in peak.cpp
+    int secondJointIdx;  // presumably an index into the candidate peak list - TODO confirm in peak.cpp
+    float score;
+};
+
+void findPeaks(const std::vector<cv::Mat>& heatMaps,  // results are written to allPeaks (the only non-const parameter)
+               const float minPeaksDistance,
+               std::vector<std::vector<Peak> >& allPeaks,
+               int heatMapId);
+
+std::vector<HumanPose> groupPeaksToPoses(  // assembles peaks into poses and returns them by value
+        const std::vector<std::vector<Peak> >& allPeaks,
+        const std::vector<cv::Mat>& pafs,
+        const size_t keypointsNumber,  // length of the keypoints vector of every returned pose
+        const float midPointsScoreThreshold,
+        const float foundMidPointsRatioThreshold,
+        const int minJointsNumber,  // poses with fewer joints are dropped
+        const float minSubsetScore);  // poses whose score / nJoints is below this are dropped
+} // namespace human_pose_estimation
+
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/wrapper.cpp b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/wrapper.cpp
new file mode 100644
index 00000000000..e9d7bfe6243
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/pose_extractor/wrapper.cpp
@@ -0,0 +1,92 @@
+// Copyright (C) 2018-2019 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#define PY_SSIZE_T_CLEAN
+#include <Python.h>
+
+#include <iostream>
+#include <stdexcept>
+#include <vector>
+
+#define NPY_NO_DEPRECATED_API NPY_1_7_API_VERSION
+#include "numpy/arrayobject.h"
+
+#include <opencv2/core/core.hpp>
+
+#include "extract_poses.hpp"
+
+static std::vector<cv::Mat> wrap_feature_maps(PyArrayObject* py_feature_maps) {  // one cv::Mat per index of axis 0
+    int num_channels = static_cast<int>(PyArray_SHAPE(py_feature_maps)[0]);  // reads shape[0..2]; the rank is not checked here
+    int h = static_cast<int>(PyArray_SHAPE(py_feature_maps)[1]);
+    int w = static_cast<int>(PyArray_SHAPE(py_feature_maps)[2]);
+    float* data = static_cast<float*>(PyArray_DATA(py_feature_maps));  // buffer is read as 32-bit floats; the dtype is not checked here
+    std::vector<cv::Mat> feature_maps(num_channels);
+    for (long c_id = 0; c_id < num_channels; c_id++) {
+        feature_maps[c_id] = cv::Mat(h, w, CV_32FC1,  // Mat header over the existing NumPy buffer
+                                     data + c_id * PyArray_STRIDE(py_feature_maps, 0) / sizeof(float),  // byte stride -> float offset
+                                     PyArray_STRIDE(py_feature_maps, 1));  // row step in bytes
+    }
+    return feature_maps;  // NOTE(review): the Mats alias py_feature_maps' memory, so they must not outlive the array
+}
+
+// extract_poses(heatmaps, pafs, ratio): returns a 2-D float32 array, one row per pose: x, y, z of every keypoint, then the pose score.
+static PyObject* extract_poses(PyObject* self, PyObject* args) {
+    PyArrayObject* py_heatmaps;
+    PyArrayObject* py_pafs;
+    int ratio;
+    // "O!" makes the parser raise TypeError for anything that is not a numpy.ndarray instead of crashing below.
+    if (!PyArg_ParseTuple(args, "O!O!i", &PyArray_Type, &py_heatmaps, &PyArray_Type, &py_pafs, &ratio)) {
+        return nullptr;
+    }
+    // NOTE(review): wrap_feature_maps() reads both buffers as 3-D float32 without checking ndim or dtype.
+    std::vector<cv::Mat> heatmaps = wrap_feature_maps(py_heatmaps);
+    std::vector<cv::Mat> pafs = wrap_feature_maps(py_pafs);
+    std::vector<human_pose_estimation::HumanPose> poses = human_pose_estimation::extractPoses(heatmaps, pafs, ratio);
+
+    const size_t num_persons = poses.size();
+    const size_t num_keypoints = poses.empty() ? 0 : poses[0].keypoints.size();
+    npy_intp dims[] = {static_cast<npy_intp>(num_persons), static_cast<npy_intp>(num_keypoints * 3 + 1)};
+    PyObject* out_array = PyArray_SimpleNew(2, dims, NPY_FLOAT);
+    if (out_array == nullptr) {
+        return nullptr;  // allocation failed; propagate the error to the caller
+    }
+    PyArrayObject* out = reinterpret_cast<PyArrayObject*>(out_array);
+    for (size_t person_id = 0; person_id < num_persons; person_id++) {
+        float* person_data = reinterpret_cast<float*>(PyArray_BYTES(out) + PyArray_STRIDE(out, 0) * person_id);
+        for (size_t kpt_id = 0; kpt_id < num_keypoints; kpt_id++) {
+            person_data[kpt_id * 3 + 0] = poses[person_id].keypoints[kpt_id].x;
+            person_data[kpt_id * 3 + 1] = poses[person_id].keypoints[kpt_id].y;
+            person_data[kpt_id * 3 + 2] = poses[person_id].keypoints[kpt_id].z;
+        }
+        person_data[num_keypoints * 3] = poses[person_id].score;  // last column of the row
+    }
+    return out_array;
+}
+
+PyMethodDef method_table[] = {  // functions exposed by the module
+    {"extract_poses", static_cast<PyCFunction>(extract_poses), METH_VARARGS,  // called with a tuple of positional arguments
+     "Extracts 2D poses from provided heatmaps and pafs"},
+    {NULL, NULL, 0, NULL}  // sentinel entry that terminates the table
+};
+
+PyModuleDef pose_extractor_module = {  // module definition passed to PyModule_Create in PyInit_pose_extractor
+    PyModuleDef_HEAD_INIT,
+    "pose_extractor",  // m_name
+    "Module for fast 2D pose extraction",  // m_doc
+    -1,  // m_size; NOTE(review): -1 presumably marks a module without per-interpreter state - confirm against the CPython docs
+    method_table  // m_methods
+};
+
+PyMODINIT_FUNC PyInit_pose_extractor(void) {
+    // Initialise the NumPy C API before the module object exists. import_array() is a
+    // macro that, on failure, sets an ImportError and returns NULL from this function,
+    // so running it first means a failed import cannot leak a created module.
+    import_array();
+
+    PyObject* module = PyModule_Create(&pose_extractor_module);
+    if (module == nullptr) {
+        return nullptr;
+    }
+    return module;
+}
diff --git a/demos/python_demos/human_pose_estimation_3d_demo/requirements.txt b/demos/python_demos/human_pose_estimation_3d_demo/requirements.txt
new file mode 100644
index 00000000000..0c697a858e2
--- /dev/null
+++ b/demos/python_demos/human_pose_estimation_3d_demo/requirements.txt
@@ -0,0 +1 @@
+numpy>=1.17.0
diff --git a/demos/python_demos/image_retrieval_demo/README.md b/demos/python_demos/image_retrieval_demo/README.md
index 91c70b38515..63cfa2f88cf 100644
--- a/demos/python_demos/image_retrieval_demo/README.md
+++ b/demos/python_demos/image_retrieval_demo/README.md
@@ -9,7 +9,7 @@ This demo demonstrates how to run Image Retrieval models using OpenVINO&trade;.
 The demo application expects an image retrieval model in the Intermediate Representation (IR) format.
 
 As input, the demo application takes:
-* a path to a list of images represeneted by textfile with following format 'path_to_image' 'ID' `--images`
+* a path to a list of images represented by textfile with following format 'path_to_image' 'ID' `--images`
 * a path to a video file or a device node of a web-camera specified with a command line argument `--video`
 
 The demo workflow is the following:
@@ -51,6 +51,7 @@ Options:
                         Optional. Required for CPU custom layers. Absolute
                         path to a shared library with the kernels
                         implementations.
+  --no_show             Optional. Do not visualize inference results.
 ```
 
 Running the application with an empty list of options yields the short version of the usage message and an error message.
@@ -63,12 +64,15 @@ To run the demo, please provide paths to the model in the IR format, to a file w
 ```bash
 python image_retrieval_demo.py \
 -m /home/user/image-retrieval-0001.xml \
--v /home/user/video.dav.mp4 \
--i /home/user/list.txt \
--l /opt/intel/openvino/inference_engine/lib/intel64/libcpu_extension_avx512.so \
+-i /home/user/video.dav.mp4 \
+-g /home/user/list.txt \
 --ground_truth text_label
 ```
 
+An example of a file listing gallery images can be found [here](https://github.com/opencv/openvino_training_extensions/blob/develop/tensorflow_toolkit/image_retrieval/data/gallery/gallery.txt).
+
+Examples of videos can be found [here](https://github.com/19900531/test).
+
 ## Demo Output
 
 The application uses OpenCV to display gallery searching result and current inference performance.
diff --git a/demos/python_demos/image_retrieval_demo/image_retrieval_demo.py b/demos/python_demos/image_retrieval_demo/image_retrieval_demo.py
index a94b6b04d82..0f10a63b65f 100755
--- a/demos/python_demos/image_retrieval_demo/image_retrieval_demo.py
+++ b/demos/python_demos/image_retrieval_demo/image_retrieval_demo.py
@@ -58,6 +58,8 @@ def build_argparser():
                       help="Optional. Required for CPU custom layers. Absolute path to "
                            "a shared library with the kernels implementations.", type=str,
                       default=None)
+    args.add_argument('--no_show', action='store_true',
+                      help='Optional. Do not visualize inference results.')
 
     return parser
 
@@ -141,7 +143,7 @@ def main():
                         [img_retrieval.impaths[i] for i in sorted_indexes],
                         distances[sorted_indexes] if position is not None else None,
                         img_retrieval.input_size, np.mean(compute_embeddings_times),
-                        np.mean(search_in_gallery_times), imshow_delay=3)
+                        np.mean(search_in_gallery_times), imshow_delay=3, no_show=args.no_show)
 
         if key == 27:
             break
diff --git a/demos/python_demos/image_retrieval_demo/image_retrieval_demo/image_retrieval.py b/demos/python_demos/image_retrieval_demo/image_retrieval_demo/image_retrieval.py
index 531425ec587..fbc6b726423 100644
--- a/demos/python_demos/image_retrieval_demo/image_retrieval_demo/image_retrieval.py
+++ b/demos/python_demos/image_retrieval_demo/image_retrieval_demo/image_retrieval.py
@@ -30,11 +30,12 @@ class IEModel(): # pylint: disable=too-few-public-methods
 
     def __init__(self, model_path, device, cpu_extension):
         ie = IECore()
-        if device == 'CPU':
+        if cpu_extension and device == 'CPU':
             ie.add_extension(cpu_extension, 'CPU')
 
         path = '.'.join(model_path.split('.')[:-1])
         self.net = IENetwork(model=path + '.xml', weights=path + '.bin')
+        self.output_name = list(self.net.outputs.keys())[0]
         self.exec_net = ie.load_network(network=self.net, device_name=device)
 
     def predict(self, image):
@@ -42,9 +43,7 @@ def predict(self, image):
 
         assert len(image.shape) == 4
         image = np.transpose(image, (0, 3, 1, 2))
-        out = self.exec_net.infer(inputs={'Placeholder': image})[
-            'model/tf_op_layer_mul/mul/Normalize']
-        out = out / np.linalg.norm(out, axis=-1)
+        out = self.exec_net.infer(inputs={'Placeholder': image})[self.output_name]
         return out
 
 
diff --git a/demos/python_demos/image_retrieval_demo/image_retrieval_demo/visualizer.py b/demos/python_demos/image_retrieval_demo/image_retrieval_demo/visualizer.py
index 4afd2b47a0f..b451c066d54 100644
--- a/demos/python_demos/image_retrieval_demo/image_retrieval_demo/visualizer.py
+++ b/demos/python_demos/image_retrieval_demo/image_retrieval_demo/visualizer.py
@@ -54,7 +54,7 @@ def add_top10_gallery_images(demo_image, impaths, distances, input_image, target
 
 
 def visualize(image, target_pos, impaths, distances, input_size, compute_embedding_time,
-              search_in_gallery_time, imshow_delay):
+              search_in_gallery_time, imshow_delay, no_show=False):
     """ Visualizes input video frame with detected ROI and
         top-10 most similar images from the gallery. """
 
@@ -95,6 +95,9 @@ def visualize(image, target_pos, impaths, distances, input_size, compute_embeddi
 
     demo_image = add_top10_gallery_images(demo_image, impaths, distances, input_image, target_pos)
 
-    cv2.imshow('demo_image', demo_image)
+    if not no_show:
+        cv2.imshow('demo_image', demo_image)
+        key_pressed = cv2.waitKey(imshow_delay)
+        return key_pressed & 0xff if key_pressed != -1 else -1
 
-    return cv2.waitKey(imshow_delay) & 0xff
+    return -1
diff --git a/demos/python_demos/instance_segmentation_demo/README.md b/demos/python_demos/instance_segmentation_demo/README.md
index eff240fe6b1..a416aa1cab0 100644
--- a/demos/python_demos/instance_segmentation_demo/README.md
+++ b/demos/python_demos/instance_segmentation_demo/README.md
@@ -70,6 +70,7 @@ Options:
   -pc, --perf_counts    Optional. Report performance counters.
   -r, --raw_output_message
                         Optional. Output inference results raw values.
+  --no_show             Optional. Don't show output
 ```
 
 Running the application with an empty list of options yields the short version of the usage message and an error message.
@@ -83,7 +84,6 @@ To run the demo, please provide paths to the model in the IR format, to a file w
 python3 instance_segmentation_demo/instance_segmentation_demo.py \
     -m <path_to_model>/instance-segmentation-security-0050.xml \
     --label instance_segmentation_demo/coco_labels.txt \
-    -l <openvino_root>/inference_engine/lib/intel64/libcpu_extension_avx2.so \
     --no_keep_aspect_ratio \
     -i 0 \
     --delay 1
diff --git a/demos/python_demos/instance_segmentation_demo/instance_segmentation_demo.py b/demos/python_demos/instance_segmentation_demo/instance_segmentation_demo.py
index a85de93c378..3b7947c4e75 100644
--- a/demos/python_demos/instance_segmentation_demo/instance_segmentation_demo.py
+++ b/demos/python_demos/instance_segmentation_demo/instance_segmentation_demo.py
@@ -79,6 +79,9 @@ def build_argparser():
     args.add_argument('-r', '--raw_output_message',
                       help='Optional. Output inference results raw values.',
                       action='store_true')
+    args.add_argument("--no_show",
+                      help="Optional. Don't show output",
+                      action='store_true')
     return parser
 
 
@@ -152,7 +155,6 @@ def main():
 
     log.info('Loading IR to the plugin...')
     exec_net = ie.load_network(network=net, device_name=args.device, num_requests=2)
-    del net
 
     try:
         input_source = int(args.input_source)
@@ -259,20 +261,20 @@ def main():
                 print('{:<70} {:<15} {:<15} {:<15} {:<10}'.format(layer, stats['layer_type'], stats['exec_type'],
                                                                   stats['status'], stats['real_time']))
 
-        # Show resulting image.
-        cv2.imshow('Results', frame)
+        if not args.no_show:
+            # Show resulting image.
+            cv2.imshow('Results', frame)
         render_end = time.time()
         render_time = render_end - render_start
 
-        key = cv2.waitKey(args.delay)
-        esc_code = 27
-        if key == esc_code:
-            break
+        if not args.no_show:
+            key = cv2.waitKey(args.delay)
+            esc_code = 27
+            if key == esc_code:
+                break
 
     cv2.destroyAllWindows()
     cap.release()
-    del exec_net
-    del ie
 
 
 if __name__ == '__main__':
diff --git a/demos/python_demos/multi_camera_multi_person_tracking/README.md b/demos/python_demos/multi_camera_multi_person_tracking/README.md
index 4354a161ba0..a7df26b02f6 100644
--- a/demos/python_demos/multi_camera_multi_person_tracking/README.md
+++ b/demos/python_demos/multi_camera_multi_person_tracking/README.md
@@ -66,6 +66,7 @@ optional arguments:
   -l CPU_EXTENSION, --cpu_extension CPU_EXTENSION
                         MKLDNN (CPU)-targeted custom layers.Absolute path to a
                         shared library with the kernels impl.
+  --no_show             Optional. Don't show output
 ```
 Minimum command examples to run the demo:
 
diff --git a/demos/python_demos/multi_camera_multi_person_tracking/multi_camera_multi_person_tracking.py b/demos/python_demos/multi_camera_multi_person_tracking/multi_camera_multi_person_tracking.py
index abafce55a52..c468c736de8 100644
--- a/demos/python_demos/multi_camera_multi_person_tracking/multi_camera_multi_person_tracking.py
+++ b/demos/python_demos/multi_camera_multi_person_tracking/multi_camera_multi_person_tracking.py
@@ -26,6 +26,7 @@
 from utils.misc import read_py_config
 from utils.video import MulticamCapture
 from utils.visualization import visualize_multicam_detections
+from openvino.inference_engine import IECore # pylint: disable=import-error,E0611
 
 log.basicConfig(stream=sys.stdout, level=log.DEBUG)
 
@@ -70,7 +71,7 @@ def run(params, capture, detector, reid):
     else:
         output_video = None
 
-    while cv.waitKey(1) != 27 and thread_body.process:
+    while thread_body.process:
         start = time.time()
         try:
             frames = thread_body.frames_queue.get_nowait()
@@ -91,7 +92,10 @@ def run(params, capture, detector, reid):
 
         fps = round(1 / (time.time() - start), 1)
         vis = visualize_multicam_detections(frames, tracked_objects, fps)
-        cv.imshow(win_name, vis)
+        if not params.no_show:
+            cv.imshow(win_name, vis)
+            if cv.waitKey(1) == 27:
+                break
         if output_video:
             output_video.write(cv.resize(vis, video_output_size))
 
@@ -128,16 +132,20 @@ def main():
                         help='MKLDNN (CPU)-targeted custom layers.Absolute \
                               path to a shared library with the kernels impl.',
                              type=str, default=None)
+    parser.add_argument("--no_show", help="Optional. Don't show output", action='store_true')
 
     args = parser.parse_args()
 
     capture = MulticamCapture(args.i)
 
-    person_detector = Detector(args.m_detector, args.t_detector,
+    log.info("Creating Inference Engine")
+    ie = IECore()
+
+    person_detector = Detector(ie, args.m_detector, args.t_detector,
                                args.device, args.cpu_extension,
                                capture.get_num_sources())
     if args.m_reid:
-        person_recognizer = VectorCNN(args.m_reid, args.device)
+        person_recognizer = VectorCNN(ie, args.m_reid, args.device)
     else:
         person_recognizer = None
     run(args, capture, person_detector, person_recognizer)
diff --git a/demos/python_demos/multi_camera_multi_person_tracking/utils/ie_tools.py b/demos/python_demos/multi_camera_multi_person_tracking/utils/ie_tools.py
index 401f5b441f0..974dfbef800 100644
--- a/demos/python_demos/multi_camera_multi_person_tracking/utils/ie_tools.py
+++ b/demos/python_demos/multi_camera_multi_person_tracking/utils/ie_tools.py
@@ -59,12 +59,12 @@ def get_input_shape(self):
         return self.inputs_info[self.input_key]
 
 
-def load_ie_model(model_xml, device, plugin_dir, cpu_extension='', num_reqs=1):
+def load_ie_model(ie, model_xml, device, plugin_dir, cpu_extension='', num_reqs=1):
     """Loads a model in the Inference Engine format"""
     model_bin = os.path.splitext(model_xml)[0] + ".bin"
     # Plugin initialization for specified device and load extensions library if specified
-    log.info("Creating Inference Engine")
-    ie = IECore()
+    log.info("Initializing Inference Engine plugin for %s ", device)
+
     if cpu_extension and 'CPU' in device:
         ie.add_extension(cpu_extension, 'CPU')
     # Read IR
diff --git a/demos/python_demos/multi_camera_multi_person_tracking/utils/network_wrappers.py b/demos/python_demos/multi_camera_multi_person_tracking/utils/network_wrappers.py
index 18ccf70400e..c13f9d7b628 100644
--- a/demos/python_demos/multi_camera_multi_person_tracking/utils/network_wrappers.py
+++ b/demos/python_demos/multi_camera_multi_person_tracking/utils/network_wrappers.py
@@ -17,8 +17,8 @@
 class Detector:
     """Wrapper class for detector"""
 
-    def __init__(self, model_path, conf=.6, device='CPU', ext_path='', max_num_frames=1):
-        self.net = load_ie_model(model_path, device, None, ext_path, num_reqs=max_num_frames)
+    def __init__(self, ie, model_path, conf=.6, device='CPU', ext_path='', max_num_frames=1):
+        self.net = load_ie_model(ie, model_path, device, None, ext_path, num_reqs=max_num_frames)
         self.confidence = conf
         self.expand_ratio = (1., 1.)
         self.max_num_frames = max_num_frames
@@ -70,9 +70,9 @@ def __decode_detections(self, out, frame_shape):
 class VectorCNN:
     """Wrapper class for a network returning a vector"""
 
-    def __init__(self, model_path, device='CPU', max_reqs=100):
+    def __init__(self, ie, model_path, device='CPU', max_reqs=100):
         self.max_reqs = max_reqs
-        self.net = load_ie_model(model_path, device, None, num_reqs=self.max_reqs)
+        self.net = load_ie_model(ie, model_path, device, None, num_reqs=self.max_reqs)
 
     def forward(self, batch):
         """Performs forward of the underlying network on a given batch"""
diff --git a/demos/python_demos/object_detection_demo_centernet/README.md b/demos/python_demos/object_detection_demo_centernet/README.md
new file mode 100644
index 00000000000..ed9c8781107
--- /dev/null
+++ b/demos/python_demos/object_detection_demo_centernet/README.md
@@ -0,0 +1,49 @@
+# Object Detection CenterNet Demo
+
+This demo showcases Object Detection with CenterNet. The task is to identify objects as axis-aligned boxes in an image.
+CenterNet models an object as a single point (the center of its bounding box), uses keypoint estimation to find center points, and regresses to the object size. The same approach is used to estimate 3D bounding boxes and poses.
+
+## How It Works
+
+On the start-up, the application reads command-line parameters and loads a network to the Inference
+Engine. Upon getting a frame from the OpenCV VideoCapture, it performs inference and displays the results.
+
+## Running
+
+Running the application with the <code>-h</code> option yields the following usage message:
+
+```
+usage: object_detection_demo_centernet.py [-h] -m MODEL [-i INPUT [INPUT ...]]
+                                          [-d DEVICE] [--labels LABELS]
+                                          [-pt PROB_THRESHOLD] [--no_show]
+
+Options:
+  -h, --help            Show this help message and exit.
+  -m MODEL, --model MODEL
+                        Required. Path to an .xml file with a trained model.
+  -i INPUT [INPUT ...], --input INPUT [INPUT ...]
+                        path to video or image/images
+  -d DEVICE, --device DEVICE
+                        Optional. Specify the target device to infer on; CPU,
+                        GPU, FPGA, HDDL or MYRIAD is acceptable. The demo will
+                        look for a suitable plugin for device specified.
+                        Default value is CPU
+  --labels LABELS       Optional. Path to labels mapping file
+  -pt PROB_THRESHOLD, --prob_threshold PROB_THRESHOLD
+                        Optional. Probability threshold for detections
+                        filtering
+  --no_show             Optional. Don't show output
+```
+
+To run the demo, you can use public or pre-trained models. You can download the pre-trained models with the OpenVINO [Model Downloader](../../../tools/downloader/README.md) or from [https://download.01.org/opencv/](https://download.01.org/opencv/).
+
+> **NOTE**: Before running the demo with a trained model, make sure the model is converted to the Inference Engine format (\*.xml + \*.bin) using the [Model Optimizer tool](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html).
+
+## Demo Output
+
+The demo uses OpenCV to display the resulting frame with detections (rendered as bounding boxes and labels, if provided) and reports performance in the following format: summary inference FPS.
+
+## See Also
+* [Using Open Model Zoo demos](../../README.md)
+* [Model Optimizer](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html)
+* [Model Downloader](../../../tools/downloader/README.md)
diff --git a/demos/python_demos/object_detection_demo_centernet/detector.py b/demos/python_demos/object_detection_demo_centernet/detector.py
new file mode 100644
index 00000000000..09bcb64ad6b
--- /dev/null
+++ b/demos/python_demos/object_detection_demo_centernet/detector.py
@@ -0,0 +1,214 @@
+"""
+ Copyright (c) 2019 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import os
+import cv2
+import numpy as np
+from numpy.lib.stride_tricks import as_strided
+
+from openvino.inference_engine import IENetwork, IECore
+
+class Detector(object):
+    def __init__(self, ie, model_path, threshold=0.3, device='CPU'):
+        """Read the IR at model_path (weights from the .bin next to it) and load it on device through ie."""
+        model = IENetwork(model=model_path, weights=os.path.splitext(model_path)[0] + '.bin')
+        assert len(model.inputs) == 1, "Expected 1 input blob"
+        assert len(model.outputs) == 3, "Expected 3 output blobs"
+        # Outputs are addressed in sorted-name order; postprocess() unpacks them as (heat, reg, wh).
+        self._input_layer_name = next(iter(model.inputs))
+        self._output_layer_names = sorted(model.outputs)
+        # Keep the caller's core object and the network loaded on the requested device.
+        self._ie = ie
+        self._exec_model = self._ie.load_network(model, device)
+        self._threshold = threshold  # minimum score a detection needs to survive postprocess()
+        self.infer_time = -1  # seconds taken by the last infer(); -1 until it has run
+        _, channels, self.input_height, self.input_width = model.inputs[self._input_layer_name].shape
+        assert channels == 3, "Expected 3-channel input"
+
+    @staticmethod
+    def get_affine_transform(center, scale, rot, output_size, inv=False):
+        """Return the 2x3 affine matrix mapping a region of width scale around center onto output_size (reversed if inv)."""
+        def get_dir(src_point, rot_rad):
+            sn, cs = np.sin(rot_rad), np.cos(rot_rad)
+            src_result = [0, 0]
+            src_result[0] = src_point[0] * cs - src_point[1] * sn
+            src_result[1] = src_point[0] * sn + src_point[1] * cs
+            return src_result  # src_point rotated by rot_rad, as a plain list
+
+        def get_3rd_point(a, b):
+            direct = a - b
+            return b + np.array([-direct[1], direct[0]], dtype=np.float32)  # b plus (a - b) turned by 90 degrees
+
+        if not isinstance(scale, np.ndarray) and not isinstance(scale, list):
+            scale = np.array([scale, scale], dtype=np.float32)  # a scalar scale is used for both axes
+
+        scale_tmp = scale
+        src_w = scale_tmp[0]  # only the first scale component is used below
+        dst_w, dst_h = output_size
+
+        rot_rad = np.pi * rot / 180  # rot is given in degrees
+        src_dir = get_dir([0, src_w * -0.5], rot_rad)
+        dst_dir = np.array([0, dst_w * -0.5], dtype=np.float32)
+        # Three point pairs define the transform: the centers, the centers shifted by half a width, and a perpendicular point.
+        dst = np.zeros((3, 2), dtype=np.float32)
+        src = np.zeros((3, 2), dtype=np.float32)
+        src[0, :], src[1, :] = center, center + src_dir
+        dst[0, :] = [dst_w * 0.5, dst_h * 0.5]
+        dst[1, :] = np.array([dst_w * 0.5, dst_h * 0.5], np.float32) + dst_dir
+        src[2:, :] = get_3rd_point(src[0, :], src[1, :])
+        dst[2:, :] = get_3rd_point(dst[0, :], dst[1, :])
+
+        if inv:
+            trans = cv2.getAffineTransform(np.float32(dst), np.float32(src))  # output -> source direction
+        else:
+            trans = cv2.getAffineTransform(np.float32(src), np.float32(dst))  # source -> output direction
+
+        return trans
+
+    @staticmethod
+    def _gather_feat(feat, ind):
+        """Return the rows of the 2-D array feat that are listed in ind, with all columns kept."""
+        columns = feat.shape[1]
+        # Repeat every row index across the columns: (N,) -> (N, columns).
+        rows = np.repeat(np.expand_dims(ind, axis=1), columns, axis=1)
+        return feat[rows, np.arange(columns)]
+
+    @staticmethod
+    def _tranpose_and_gather_feat(feat, ind):
+        """Flatten a (C, H, W) map into (H * W, C) rows and return the rows listed in ind."""
+        channels_last = np.transpose(feat, (1, 2, 0))
+        flat = channels_last.reshape((-1, channels_last.shape[2]))
+        return Detector._gather_feat(flat, ind)
+
+    @staticmethod
+    def _topk(scores, K=40):
+        """Pick the K highest peaks over all classes; returns (score, flat index, class, y, x), in no particular order."""
+        cat, _, width = scores.shape
+        # Per-class pass: positions of the K largest scores of every class (argpartition does not sort them).
+        scores = scores.reshape((cat, -1))
+        topk_inds = np.argpartition(scores, -K, axis=1)[:, -K:]
+        topk_scores = scores[np.arange(scores.shape[0])[:, None], topk_inds]
+        # Flat spatial index -> (row, column). The builtin float replaces np.float, which NumPy 1.24 removed.
+        topk_ys = (topk_inds / width).astype(np.int32).astype(float)
+        topk_xs = (topk_inds % width).astype(np.int32).astype(float)
+        # Global pass: the K largest among the cat * K per-class candidates.
+        topk_scores = topk_scores.reshape((-1))
+        topk_ind = np.argpartition(topk_scores, -K)[-K:]
+        topk_score = topk_scores[topk_ind]
+        topk_clses = topk_ind / K  # NOTE(review): true division keeps a fraction; the class row is topk_ind // K - confirm callers truncate
+        topk_inds = Detector._gather_feat(topk_inds.reshape((-1, 1)), topk_ind).reshape((K))
+        topk_ys = Detector._gather_feat(topk_ys.reshape((-1, 1)), topk_ind).reshape((K))
+        topk_xs = Detector._gather_feat(topk_xs.reshape((-1, 1)), topk_ind).reshape((K))
+
+        return topk_score, topk_inds, topk_clses, topk_ys, topk_xs
+
+    @staticmethod
+    def _nms(heat, kernel=3):
+        """Zero every value of heat that is not the maximum of its kernel x kernel neighbourhood, channel by channel."""
+        def max_pool2d(A, kernel_size, padding=1, stride=1):
+            A = np.pad(A, padding, mode='constant')  # constant padding on every side of the 2-D channel
+            output_shape = ((A.shape[0] - kernel_size)//stride + 1,
+                            (A.shape[1] - kernel_size)//stride + 1)
+            kernel_size = (kernel_size, kernel_size)
+            A_w = as_strided(A, shape=output_shape + kernel_size,  # 4-D sliding-window view: one kernel window per output cell
+                             strides=(stride*A.strides[0],
+                                      stride*A.strides[1]) + A.strides)
+            A_w = A_w.reshape(-1, *kernel_size)
+
+            return A_w.max(axis=(1, 2)).reshape(output_shape)  # maximum of every window
+
+        pad = (kernel - 1) // 2  # keeps the pooled map the same size as the input for odd kernels
+        hmax = np.array([max_pool2d(channel, kernel, pad) for channel in heat])
+        keep = (hmax == heat)  # True only where a value equals its neighbourhood maximum
+        return heat * keep
+
+    @staticmethod
+    def _transform_preds(coords, center, scale, output_size):
+        """Map the (x, y) rows of coords through the inverse transform built by get_affine_transform."""
+        def affine_transform(pt, t):
+            # Homogeneous (x, y, 1) vector multiplied by the 2x3 matrix.
+            homogeneous = np.array([pt[0], pt[1], 1.], dtype=np.float32).T
+            return np.dot(t, homogeneous)[:2]
+        inverse = Detector.get_affine_transform(center, scale, 0, output_size, inv=True)
+        target_coords = np.zeros(coords.shape)
+        for row, point in enumerate(coords):
+            target_coords[row, 0:2] = affine_transform(point[0:2], inverse)
+        return target_coords
+
+    @staticmethod
+    def _transform(dets, center, scale, height, width):
+        """Transform both box corners of dets (columns 0-1, then 2-3) in place and return dets."""
+        output_size = (width, height)
+        for first in (0, 2):
+            dets[:, first:first + 2] = Detector._transform_preds(dets[:, first:first + 2], center, scale, output_size)
+        return dets
+
+    def preprocess(self, image):
+        """Warp image to the network input size (input_width x input_height) with an affine transform."""
+        height, width = image.shape[0:2]
+        center = np.array([width / 2., height / 2.], dtype=np.float32)  # (x, y) of the image center
+        scale = max(height, width)  # the longer image side is what gets mapped onto the input width
+        trans_input = self.get_affine_transform(center, scale, 0, [self.input_width, self.input_height])
+        resized_image = cv2.resize(image, (width, height))  # NOTE(review): target size equals the source size - looks like a plain copy
+        inp_image = cv2.warpAffine(
+            resized_image, trans_input, (self.input_width, self.input_height),
+            flags=cv2.INTER_LINEAR)
+
+        return inp_image
+
+    def postprocess(self, raw_output, image_sizes):
+        """Decode (heat, reg, wh) into rows of [x1, y1, x2, y2, score, class], mapped back by the inverse input transform."""
+        heat, reg, wh = raw_output
+        heat = np.exp(-np.logaddexp(0, -heat))  # sigmoid; exp(x) / (1 + exp(x)) turned large logits into inf / inf = nan
+        height, width = heat.shape[1:3]
+        num_predictions = 100
+        heat = self._nms(heat)
+        scores, inds, clses, ys, xs = self._topk(heat, K=num_predictions)
+        reg = self._tranpose_and_gather_feat(reg, inds)
+        # Refine the integer peak cells with the regressed offsets.
+        reg = reg.reshape((num_predictions, 2))
+        xs = xs.reshape((num_predictions, 1)) + reg[:, 0:1]
+        ys = ys.reshape((num_predictions, 1)) + reg[:, 1:2]
+        # Boxes are the refined centers minus / plus half of the regressed width and height.
+        wh = self._tranpose_and_gather_feat(wh, inds)
+        wh = wh.reshape((num_predictions, 2))
+        clses = clses.reshape((num_predictions, 1))
+        scores = scores.reshape((num_predictions, 1))
+        bboxes = np.concatenate((xs - wh[..., 0:1] / 2,
+                                 ys - wh[..., 1:2] / 2,
+                                 xs + wh[..., 0:1] / 2,
+                                 ys + wh[..., 1:2] / 2), axis=1)
+        detections = np.concatenate((bboxes, scores, clses), axis=1)
+        mask = detections[..., 4] >= self._threshold  # column 4 holds the score
+        filtered_detections = detections[mask]
+        scale = max(image_sizes)  # same scale and center as preprocess() used
+        center = np.array(image_sizes[:2])/2.0  # (height, width) / 2; flipped to (x, y) below
+        dets = self._transform(filtered_detections, np.flip(center, 0), scale, height, width)
+        return dets
+
+    def infer(self, image):
+        t0 = cv2.getTickCount()  # tick counter before the request, used for timing
+        output = self._exec_model.infer(inputs={self._input_layer_name: image})  # blocking call; result is indexed by output name in detect()
+        self.infer_time = (cv2.getTickCount() - t0) / cv2.getTickFrequency()  # ticks / (ticks per second) = seconds
+        return output
+
+    def detect(self, image):
+        """Run preprocess, infer and postprocess on one image and return the detections."""
+        image_sizes = image.shape[:2]
+        network_input = np.transpose(self.preprocess(image), (2, 0, 1))
+        output = self.infer(network_input)
+        raw_output = [output[name][0] for name in self._output_layer_names]
+        return self.postprocess(raw_output, image_sizes)
diff --git a/demos/python_demos/object_detection_demo_centernet/models.lst b/demos/python_demos/object_detection_demo_centernet/models.lst
new file mode 100644
index 00000000000..4d8bbdb7af6
--- /dev/null
+++ b/demos/python_demos/object_detection_demo_centernet/models.lst
@@ -0,0 +1,3 @@
+# This file can be used with the --list option of the model downloader.
+ctdet_coco_dlav0_384
+ctdet_coco_dlav0_512
diff --git a/demos/python_demos/object_detection_demo_centernet/object_detection_demo_centernet.py b/demos/python_demos/object_detection_demo_centernet/object_detection_demo_centernet.py
new file mode 100644
index 00000000000..22b7a64af2b
--- /dev/null
+++ b/demos/python_demos/object_detection_demo_centernet/object_detection_demo_centernet.py
@@ -0,0 +1,123 @@
+"""
+ Copyright (c) 2019 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+import sys
+import cv2
+import numpy as np
+from argparse import ArgumentParser, SUPPRESS
+
+from openvino.inference_engine import IECore
+
+from detector import Detector
+
+def build_argparser():
+    """Build the CLI parser; --input is required because main() indexes args.input[0]."""
+    parser = ArgumentParser(add_help=False)
+    args = parser.add_argument_group('Options')
+    args.add_argument('-h', '--help', action='help', default=SUPPRESS, help='Show this help message and exit.')
+    args.add_argument("-m", "--model", help="Required. Path to an .xml file with a trained model.",
+                      required=True, type=str)
+    args.add_argument("-i", "--input", type=str, nargs='+', required=True, help="path to video or image/images")
+    args.add_argument("-d", "--device",
+                      help="Optional. Specify the target device to infer on; CPU, GPU, FPGA, HDDL or MYRIAD is "
+                           "acceptable. The demo will look for a suitable plugin for device specified. "
+                           "Default value is CPU", default="CPU", type=str)
+    args.add_argument("--labels", help="Optional. Path to labels mapping file", default=None, type=str)
+    args.add_argument("-pt", "--prob_threshold", help="Optional. Probability threshold for detections filtering",
+                      default=0.3, type=float)
+    args.add_argument("--no_show", help="Optional. Don't show output", action='store_true')
+    return parser
+
+class ImageReader(object):  # iterator that decodes the given image files one by one
+    def __init__(self, file_names):
+        self.file_names = file_names
+        self.max_idx = len(file_names)
+
+    def __iter__(self):
+        self.idx = 0  # restart from the first file on every new iteration
+        return self
+
+    def __next__(self):
+        if self.idx == self.max_idx:
+            raise StopIteration
+        img = cv2.imread(self.file_names[self.idx], cv2.IMREAD_COLOR)
+        if img is None or img.size == 0:  # cv2.imread reports a failed read by returning None
+            raise IOError('Image {} cannot be read'.format(self.file_names[self.idx]))
+        self.idx += 1
+        return img
+
+
+class VideoReader(object):  # iterator over the frames of the first entry of `file_name`
+    def __init__(self, file_name):
+        try:
+            self.file_name = int(file_name[0])  # a numeric string is passed to OpenCV as an int
+        except (TypeError, ValueError):  # not a number: keep it as given (a path)
+            self.file_name = file_name[0]
+
+    def __iter__(self):
+        self.cap = cv2.VideoCapture(self.file_name)
+        if not self.cap.isOpened():
+            raise IOError('Video {} cannot be opened'.format(self.file_name))
+        return self
+
+    def __next__(self):
+        was_read, img = self.cap.read()
+        if not was_read:
+            self.cap.release()  # free the file/device once no more frames can be read
+            raise StopIteration
+        return img
+
+def main():
+    """Run CenterNet detection over the input images/video and draw boxes, labels and FPS."""
+    args = build_argparser().parse_args()
+    if not args.input:  # guards the args.input[0] access below
+        raise ValueError('--input has to be set')
+
+    ie = IECore()
+    detector = Detector(ie, args.model, args.prob_threshold, args.device)
+
+    # An input OpenCV cannot decode as an image is handed to VideoReader instead.
+    img = cv2.imread(args.input[0], cv2.IMREAD_COLOR)
+    frames_reader, delay = (VideoReader(args.input), 1) if img is None else (ImageReader(args.input), 0)
+
+    labels_map = None
+    if args.labels:
+        with open(args.labels, 'r') as f:
+            labels_map = [x.strip() for x in f]
+
+    for frame in frames_reader:
+        detections = detector.detect(frame)
+        for det in detections:
+            # Built-in int() replaces the np.int alias, which NumPy 1.24 removed.
+            xmin, ymin = max(0, int(det[0])), max(0, int(det[1]))
+            xmax, ymax = min(frame.shape[1], int(det[2])), min(frame.shape[0], int(det[3]))
+            class_id = det[5]
+            det_label = labels_map[int(class_id)] if labels_map else str(int(class_id))
+            color = (min(class_id * 12.5, 255), min(class_id * 7, 255), min(class_id * 3, 255))
+            cv2.rectangle(frame, (xmin, ymin), (xmax, ymax), color, 2)
+            cv2.putText(frame, det_label + ' ' + str(round(det[4] * 100, 1)) + ' %', (xmin, ymin - 7),
+                         cv2.FONT_HERSHEY_COMPLEX, 0.6, color, 1)
+
+        # One inference per frame: FPS depends on infer_time only, not on how many boxes were found.
+        fps = 1 / detector.infer_time if detector.infer_time > 0 else 0.0
+        cv2.putText(frame, 'summary: {:.1f} FPS'.format(fps), (5, 15), cv2.FONT_HERSHEY_COMPLEX, 0.5, (0, 0, 200))
+        if not args.no_show:
+            cv2.imshow('CenterNet Detection Demo', frame)
+            if cv2.waitKey(delay) == 27:  # ESC quits
+                return
+
+if __name__ == "__main__":
+    sys.exit(main() or 0)  # main() returns None, so `or 0` turns that into exit status 0
+
diff --git a/demos/python_demos/object_detection_demo_ssd_async/README.md b/demos/python_demos/object_detection_demo_ssd_async/README.md
index e1740e532b2..703fedda256 100644
--- a/demos/python_demos/object_detection_demo_ssd_async/README.md
+++ b/demos/python_demos/object_detection_demo_ssd_async/README.md
@@ -131,6 +131,7 @@ Options:
   -pt PROB_THRESHOLD, --prob_threshold PROB_THRESHOLD
                         Optional. Probability threshold for detections
                         filtering
+  --no_show             Optional. Don't show output
 ```
 
 Running the application with the empty list of options yields the usage message given above and an error message.
diff --git a/demos/python_demos/object_detection_demo_ssd_async/models.lst b/demos/python_demos/object_detection_demo_ssd_async/models.lst
index 70702bc6921..c6544958d4d 100644
--- a/demos/python_demos/object_detection_demo_ssd_async/models.lst
+++ b/demos/python_demos/object_detection_demo_ssd_async/models.lst
@@ -5,6 +5,7 @@ face-detection-retail-????
 pedestrian-and-vehicle-detector-adas-????
 pedestrian-detection-adas-????
 pedestrian-detection-adas-binary-????
+person-detection-retail-0013
 vehicle-detection-adas-????
 vehicle-detection-adas-binary-????
 vehicle-license-plate-detection-barrier-????
diff --git a/demos/python_demos/object_detection_demo_ssd_async/object_detection_demo_ssd_async.py b/demos/python_demos/object_detection_demo_ssd_async/object_detection_demo_ssd_async.py
index d901fe8d5af..ec63397b63e 100755
--- a/demos/python_demos/object_detection_demo_ssd_async/object_detection_demo_ssd_async.py
+++ b/demos/python_demos/object_detection_demo_ssd_async/object_detection_demo_ssd_async.py
@@ -45,6 +45,7 @@ def build_argparser():
     args.add_argument("--labels", help="Optional. Path to labels mapping file", default=None, type=str)
     args.add_argument("-pt", "--prob_threshold", help="Optional. Probability threshold for detections filtering",
                       default=0.5, type=float)
+    args.add_argument("--no_show", help="Optional. Don't show output", action='store_true')
 
     return parser
 
@@ -98,22 +99,24 @@ def main():
         input_stream = 0
     else:
         input_stream = args.input
-        assert os.path.isfile(args.input), "Specified input file doesn't exist"
+    cap = cv2.VideoCapture(input_stream)
+    assert cap.isOpened(), "Can't open " + input_stream
+
     if args.labels:
         with open(args.labels, 'r') as f:
             labels_map = [x.strip() for x in f]
     else:
         labels_map = None
 
-    cap = cv2.VideoCapture(input_stream)
-
     cur_request_id = 0
     next_request_id = 1
 
     log.info("Starting inference in async mode...")
     is_async_mode = True
     render_time = 0
-    ret, frame = cap.read()
+    if is_async_mode:
+        ret, frame = cap.read()
+        frame_h, frame_w = frame.shape[:2]
 
     print("To close the application, press 'CTRL+C' here or switch to the output window and press ESC key")
     print("To switch between sync/async modes, press TAB key in the output window")
@@ -123,10 +126,10 @@ def main():
             ret, next_frame = cap.read()
         else:
             ret, frame = cap.read()
+            if ret:
+                frame_h, frame_w = frame.shape[:2]
         if not ret:
-            break
-        initial_w = cap.get(3)
-        initial_h = cap.get(4)
+            break  # abandons the last frame in case of async_mode
         # Main sync point:
         # in the truly Async mode we start the NEXT infer request, while waiting for the CURRENT to complete
         # in the regular mode we start the CURRENT request and immediately wait for it's completion
@@ -152,10 +155,10 @@ def main():
             for obj in res[0][0]:
                 # Draw only objects when probability more than specified threshold
                 if obj[2] > args.prob_threshold:
-                    xmin = int(obj[3] * initial_w)
-                    ymin = int(obj[4] * initial_h)
-                    xmax = int(obj[5] * initial_w)
-                    ymax = int(obj[6] * initial_h)
+                    xmin = int(obj[3] * frame_w)
+                    ymin = int(obj[4] * frame_h)
+                    xmax = int(obj[5] * frame_w)
+                    ymax = int(obj[6] * frame_h)
                     class_id = int(obj[1])
                     # Draw box and label\class_id
                     color = (min(class_id * 12.5, 255), min(class_id * 7, 255), min(class_id * 5, 255))
@@ -173,25 +176,28 @@ def main():
 
             cv2.putText(frame, inf_time_message, (15, 15), cv2.FONT_HERSHEY_COMPLEX, 0.5, (200, 10, 10), 1)
             cv2.putText(frame, render_time_message, (15, 30), cv2.FONT_HERSHEY_COMPLEX, 0.5, (10, 10, 200), 1)
-            cv2.putText(frame, async_mode_message, (10, int(initial_h - 20)), cv2.FONT_HERSHEY_COMPLEX, 0.5,
+            cv2.putText(frame, async_mode_message, (10, int(frame_h - 20)), cv2.FONT_HERSHEY_COMPLEX, 0.5,
                         (10, 10, 200), 1)
 
         #
         render_start = time.time()
-        cv2.imshow("Detection Results", frame)
+        if not args.no_show:
+            cv2.imshow("Detection Results", frame)
         render_end = time.time()
         render_time = render_end - render_start
 
         if is_async_mode:
             cur_request_id, next_request_id = next_request_id, cur_request_id
             frame = next_frame
-
-        key = cv2.waitKey(1)
-        if key == 27:
-            break
-        if (9 == key):
-            is_async_mode = not is_async_mode
-            log.info("Switched to {} mode".format("async" if is_async_mode else "sync"))
+            frame_h, frame_w = frame.shape[:2]
+
+        if not args.no_show:
+            key = cv2.waitKey(1)
+            if key == 27:
+                break
+            if (9 == key):
+                is_async_mode = not is_async_mode
+                log.info("Switched to {} mode".format("async" if is_async_mode else "sync"))
 
     cv2.destroyAllWindows()
 
diff --git a/demos/python_demos/object_detection_demo_yolov3_async/README.md b/demos/python_demos/object_detection_demo_yolov3_async/README.md
index 45ab11b7b4e..49734abf1cf 100644
--- a/demos/python_demos/object_detection_demo_yolov3_async/README.md
+++ b/demos/python_demos/object_detection_demo_yolov3_async/README.md
@@ -39,7 +39,7 @@ Options:
   -m MODEL, --model MODEL
                         Required. Path to an .xml file with a trained model.
   -i INPUT, --input INPUT
-                        Required. Path to a image/video file. (Specify 'cam'
+                        Required. Path to an image/video file. (Specify 'cam'
                         to work with camera)
   -l CPU_EXTENSION, --cpu_extension CPU_EXTENSION
                         Optional. Required for CPU custom layers. Absolute
diff --git a/demos/python_demos/object_detection_demo_yolov3_async/object_detection_demo_yolov3_async.py b/demos/python_demos/object_detection_demo_yolov3_async/object_detection_demo_yolov3_async.py
index 3ad8540badd..53bcf8ccc7f 100755
--- a/demos/python_demos/object_detection_demo_yolov3_async/object_detection_demo_yolov3_async.py
+++ b/demos/python_demos/object_detection_demo_yolov3_async/object_detection_demo_yolov3_async.py
@@ -36,7 +36,7 @@ def build_argparser():
     args.add_argument('-h', '--help', action='help', default=SUPPRESS, help='Show this help message and exit.')
     args.add_argument("-m", "--model", help="Required. Path to an .xml file with a trained model.",
                       required=True, type=str)
-    args.add_argument("-i", "--input", help="Required. Path to a image/video file. (Specify 'cam' to work with "
+    args.add_argument("-i", "--input", help="Required. Path to an image/video file. (Specify 'cam' to work with "
                                             "camera)", required=True, type=str)
     args.add_argument("-l", "--cpu_extension",
                       help="Optional. Required for CPU custom layers. Absolute path to a shared library with "
diff --git a/demos/python_demos/requirements.txt b/demos/python_demos/requirements.txt
index 6f1e5232f72..e76286bba86 100644
--- a/demos/python_demos/requirements.txt
+++ b/demos/python_demos/requirements.txt
@@ -1,2 +1,5 @@
-opencv-python
-numpy
\ No newline at end of file
+nibabel
+numpy
+scikit-learn
+scipy
+tqdm
diff --git a/demos/python_demos/segmentation_demo/segmentation_demo.py b/demos/python_demos/segmentation_demo/segmentation_demo.py
index a5b7faabf35..f6f94779964 100755
--- a/demos/python_demos/segmentation_demo/segmentation_demo.py
+++ b/demos/python_demos/segmentation_demo/segmentation_demo.py
@@ -100,11 +100,17 @@ def main():
     out_blob = next(iter(net.outputs))
     net.batch_size = len(args.input)
 
+    # NB: This is required to load the image as uint8 np.array
+    #     Without this step the input blob is loaded in FP32 precision,
+    #     this requires additional operation and more memory.
+    net.inputs[input_blob].precision = "U8"
+
     # Read and pre-process input images
     n, c, h, w = net.inputs[input_blob].shape
     images = np.ndarray(shape=(n, c, h, w))
     for i in range(n):
         image = cv2.imread(args.input[i])
+        assert image.dtype == np.uint8
         if image.shape[:-1] != (h, w):
             log.warning("Image {} is resized from {} to {}".format(args.input[i], image.shape[:-1], (h, w)))
             image = cv2.resize(image, (w, h))
diff --git a/demos/python_demos/single_human_pose_estimation_demo/README.md b/demos/python_demos/single_human_pose_estimation_demo/README.md
new file mode 100644
index 00000000000..75d2f2588ca
--- /dev/null
+++ b/demos/python_demos/single_human_pose_estimation_demo/README.md
@@ -0,0 +1,46 @@
+# Single Human Pose Estimation Demo (top-down pipeline)
+
+This demo showcases a top-down pipeline for human pose estimation on a video or an image. The task is to predict a bounding box for every person in the frame and then to predict a pose for every detected person. The pose may contain up to 17 keypoints: ears, eyes, nose, shoulders, elbows, wrists, hips, knees, and ankles.
+
+# How It Works
+
+On start-up, the application reads the command-line parameters and loads the person detection model and the single human pose estimation model. Upon getting a frame from the OpenCV VideoCapture, the demo executes the top-down pipeline for this frame and displays the results.
+
+# Running
+
+Running the application with the `-h` option yields the following usage message:
+```
+usage: single_human_pose_estimation_demo.py [-h] -m_od MODEL_OD -m_hpe
+                                            MODEL_HPE [-i INPUT [INPUT ...]]
+                                            [-d DEVICE]
+                                            [--person_label PERSON_LABEL]
+                                            [--no_show]
+
+optional arguments:
+  -h, --help            show this help message and exit
+  -m_od MODEL_OD, --model_od MODEL_OD
+                        path to model of object detector in xml format
+  -m_hpe MODEL_HPE, --model_hpe MODEL_HPE
+                        path to model of human pose estimator in xml format
+  -i INPUT [INPUT ...], --input INPUT [INPUT ...]
+                        path to video or image/images
+  -d DEVICE, --device DEVICE
+                        Specify the target to infer on CPU or GPU
+  --person_label PERSON_LABEL
+                        Label of class person for detector
+  --no_show             Optional. Do not display output.
+```
+To run the demo, you can use public or pre-trained models. To download the pre-trained models, use the OpenVINO Model Downloader or go to [https://download.01.org/opencv/](https://download.01.org/opencv/).
+
+For example, to do inference on a CPU, run the following command:
+
+```sh
+python single_human_pose_estimation_demo.py --model_od <path_to_dir__with_models>/mobilenet-ssd.xml --model_hpe <path_to_dir__with_models>/single-human-pose-estimation-0001.xml --input <path_to_video>/back-passengers.avi
+```
+
+The demo uses OpenCV to display the resulting frame with estimated poses and reports performance in the following format: summary inference FPS (single human pose inference FPS / detector inference FPS).
+
+## See Also
+* [Using Open Model Zoo demos](../../README.md)
+* [Model Optimizer](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html)
+* [Model Downloader](../../../tools/downloader/README.md)
diff --git a/demos/python_demos/single_human_pose_estimation_demo/detector.py b/demos/python_demos/single_human_pose_estimation_demo/detector.py
new file mode 100644
index 00000000000..a02dd5b63fb
--- /dev/null
+++ b/demos/python_demos/single_human_pose_estimation_demo/detector.py
@@ -0,0 +1,72 @@
+import os
+import cv2
+
+from openvino.inference_engine import IENetwork, IECore
+
+
+class Detector(object):
+    """Runs a network with a 4-D output of 7-value rows and returns boxes of one class as [x, y, w, h]."""
+
+    def __init__(self, ie, path_to_model_xml, label_class, scale=None, thr=0.3, device='CPU'):
+        self.OUTPUT_SIZE = 7
+        self.CHANNELS_SIZE = 3
+        self.model = IENetwork(model=path_to_model_xml, weights=os.path.splitext(path_to_model_xml)[0] + '.bin')
+
+        assert len(self.model.inputs) == 1, "Expected 1 input blob"
+        assert len(self.model.outputs) == 1, "Expected 1 output blob"
+
+        self._input_layer_name = next(iter(self.model.inputs))
+        self._output_layer_name = next(iter(self.model.outputs))
+
+        assert len(self.model.inputs[self._input_layer_name].shape) == 4 and \
+               self.model.inputs[self._input_layer_name].shape[1] == self.CHANNELS_SIZE, \
+            "Expected model input shape with %s channels " % (self.CHANNELS_SIZE)
+        assert len(self.model.outputs[self._output_layer_name].shape) == 4 and \
+               self.model.outputs[self._output_layer_name].shape[3] == self.OUTPUT_SIZE, \
+            "Expected model output shape with %s outputs" % (self.OUTPUT_SIZE)
+
+        self._ie = ie
+        self._exec_model = self._ie.load_network(self.model, device)
+        self._scale = scale  # stored only; nothing in this class reads it
+        self._thr = thr
+        self._label_class = label_class
+        _, _, self.input_h, self.input_w = self.model.inputs[self._input_layer_name].shape
+        self._h = -1  # size of the last frame seen by _preprocess (-1 until then)
+        self._w = -1
+        self.infer_time = -1  # seconds taken by the last _infer call (-1 until then)
+
+    def _preprocess(self, img):
+        """Remember the frame size, resize the frame to the network input and return it as 1xCxHxW."""
+        self._h, self._w, _ = img.shape
+        if self._h != self.input_h or self._w != self.input_w:
+            # dsize fully determines the result, so no fx/fy scale factors are passed.
+            img = cv2.resize(img, dsize=(self.input_w, self.input_h))
+        img = img.transpose(2, 0, 1)
+        return img[None, ]
+
+    def _infer(self, prep_img):
+        """Run the network on `prep_img`, recording the elapsed seconds in `infer_time`."""
+        t0 = cv2.getTickCount()
+        output = self._exec_model.infer(inputs={self._input_layer_name: prep_img})
+        self.infer_time = (cv2.getTickCount() - t0) / cv2.getTickFrequency()
+        return output
+
+    def _postprocess(self, bboxes):
+        """Keep rows of the wanted class above the threshold, as pixel [xmin, ymin, width, height]."""
+        def coord_translation(bbox):
+            # Corner coordinates are scaled by the size of the last preprocessed frame.
+            xmin = int(self._w * bbox[0])
+            ymin = int(self._h * bbox[1])
+            xmax = int(self._w * bbox[2])
+            ymax = int(self._h * bbox[3])
+            return [xmin, ymin, xmax - xmin, ymax - ymin]
+
+        # Row layout used here: [1] is the class label, [2] the confidence, [3:] the box corners.
+        return [coord_translation(bbox[3:]) for bbox in bboxes
+                if bbox[1] == self._label_class and bbox[2] > self._thr]
+
+    def detect(self, img):
+        """Return the boxes found in the frame `img` (see `_postprocess` for the format)."""
+        img = self._preprocess(img)
+        output = self._infer(img)
+        return self._postprocess(output[self._output_layer_name][0][0])
diff --git a/demos/python_demos/single_human_pose_estimation_demo/estimator.py b/demos/python_demos/single_human_pose_estimation_demo/estimator.py
new file mode 100644
index 00000000000..105d152b9cd
--- /dev/null
+++ b/demos/python_demos/single_human_pose_estimation_demo/estimator.py
@@ -0,0 +1,137 @@
+import os
+import numpy as np
+
+import cv2
+from openvino.inference_engine import IENetwork
+
+def preprocess_bbox(bbox, image):
+    """Clip an [x, y, w, h] box to `image` and return its (center, scale) as float32 arrays.
+
+    `center` is the (x, y) centre of the clipped box; `scale` is its (w, h) after one side has been
+    grown to reach a 0.75 width/height ratio, multiplied by 1.25. `bbox` itself is not modified.
+    """
+    aspect_ratio = 0.75
+    img_h, img_w = image.shape[:2]
+    x1 = np.clip(bbox[0], 0, img_w - 1)  # x is bounded by the width (shape[1]), not the height
+    y1 = np.clip(bbox[1], 0, img_h - 1)
+    x2 = np.min((img_w - 1, x1 + np.max((0, bbox[2] - 1))))
+    y2 = np.min((img_h - 1, y1 + np.max((0, bbox[3] - 1))))
+    w_box, h_box = x2 - x1, y2 - y1
+
+    center = np.array([np.float32(x1 + w_box * 0.5), np.float32(y1 + h_box * 0.5)])
+
+    if w_box > aspect_ratio * h_box:
+        h_box = w_box * 1.0 / aspect_ratio
+    elif w_box < aspect_ratio * h_box:
+        w_box = h_box * aspect_ratio
+
+    return center, np.array([w_box, h_box], np.float32) * 1.25
+
+
+def extract_keypoints(heatmap, min_confidence=-100):
+    """Return (peak_value, (x, y)) for a 2-D heatmap; (x, y) is (-1, -1) below `min_confidence`."""
+    row, col = np.unravel_index(np.argmax(heatmap, axis=None), heatmap.shape)
+    peak = heatmap[row][col]  # read before any sentinel is chosen, so it is always the true maximum
+    if peak < min_confidence:
+        return peak, (-1, -1)
+    return peak, (int(col), int(row))
+
+
+def affine_transform(pt, t):  # map the 2-D point `pt` through the affine matrix `t`
+    homogeneous = [pt[0], pt[1], 1.]
+    return np.dot(t, homogeneous)[:2]
+
+
+class TransformedCrop(object):
+    """Warps a bounding box to the network input size and supplies the inverse output-size map."""
+
+    def __init__(self, input_height=384, input_width=288, output_height=48, output_width=36):
+        self._num_keypoints = 17
+        self.input_width = input_width
+        self.input_height = input_height
+        self.output_width = output_width
+        self.output_height = output_height
+
+    def __call__(self, img, bbox):
+        """Return (inverse 2x3 matrix at output resolution, warped crop as a 1xCxHxW array)."""
+        center, scale = preprocess_bbox(bbox, img)
+        in_size = (self.input_width, self.input_height)
+        forward, _ = self.get_trasformation_matrix(center, scale, list(in_size))
+        crop = cv2.warpAffine(img, forward, in_size, flags=cv2.INTER_LINEAR)
+        _, inverse = self.get_trasformation_matrix(center, scale, [self.output_width, self.output_height])
+        return inverse, crop.transpose(2, 0, 1)[None, ]
+
+    @staticmethod
+    def get_trasformation_matrix(center, scale, output_size):
+        """Return (box -> output, output -> box) affine matrices built from three point pairs."""
+        box_w, _ = scale  # only the width is used; both shifts below are derived from it
+        half_w, half_h = output_size[0] * 0.5, output_size[1] * 0.5
+
+        # Source triangle: box centre, a point half a box-width above it, and one to its left.
+        src = np.zeros((3, 2), dtype=np.float32)
+        src[0, :] = center
+        src[1, :] = center + [0, - box_w * 0.5]
+        src[2, :] = center + [- box_w * 0.5, 0]
+
+        # Destination triangle: output centre, half an output-width above it, and the left edge.
+        dst = np.zeros((3, 2), dtype=np.float32)
+        dst[0, :] = [half_w, half_h]
+        dst[1, :] = [half_w, half_h - half_w]
+        dst[2, :] = [0, half_h]
+
+        forward = cv2.getAffineTransform(np.float32(src), np.float32(dst))
+        return forward, cv2.getAffineTransform(np.float32(dst), np.float32(src))
+
+
+class HumanPoseEstimator(object):
+    """Wraps a pose network: crops a box from the frame, infers heatmaps, returns frame-space points."""
+
+    def __init__(self, ie, path_to_model_xml, scale=None, thr=-100, device='CPU'):
+        self.model = IENetwork(model=path_to_model_xml, weights=os.path.splitext(path_to_model_xml)[0] + '.bin')
+
+        assert len(self.model.inputs) == 1, "Expected 1 input blob"
+        assert len(self.model.outputs) == 1, "Expected 1 output blob"
+
+        self._input_layer_name = next(iter(self.model.inputs))
+        self._output_layer_name = next(iter(self.model.outputs))
+        self.CHANNELS_SIZE = 3
+        self.OUTPUT_CHANNELS_SIZE = 17
+
+        input_shape = self.model.inputs[self._input_layer_name].shape
+        output_shape = self.model.outputs[self._output_layer_name].shape
+        assert len(input_shape) == 4 and input_shape[1] == self.CHANNELS_SIZE,\
+               "Expected model input blob with shape [1, 3, H, W]"
+        assert len(output_shape) == 4 and output_shape[1] == self.OUTPUT_CHANNELS_SIZE,\
+            "Expected model output shape [1, %s, H, W]" % (self.OUTPUT_CHANNELS_SIZE)
+
+        self._ie = ie
+        self._exec_model = self._ie.load_network(self.model, device)
+        self._scale = scale
+        self._thr = thr  # NOTE(review): stored but not read anywhere in this class
+
+        _, _, self.input_h, self.input_w = self.model.inputs[self._input_layer_name].shape
+        _, _, self.output_h, self.output_w = self.model.outputs[self._output_layer_name].shape
+        self._transform = TransformedCrop(self.input_h, self.input_w, self.output_h, self.output_w)
+        self.infer_time = -1  # seconds taken by the last _infer call (-1 until then)
+
+    def _preprocess(self, img, bbox):
+        """Return whatever the TransformedCrop yields for `bbox`: (inverse matrix, network input)."""
+        return self._transform(img, bbox)
+
+    def _infer(self, prep_img):
+        """Run the network, store the elapsed seconds in `infer_time`, return element [0] of the output."""
+        start_ticks = cv2.getTickCount()
+        result = self._exec_model.infer(inputs={self._input_layer_name: prep_img})
+        self.infer_time = ((cv2.getTickCount() - start_ticks) / cv2.getTickFrequency())
+        return result[self._output_layer_name][0]
+
+    @staticmethod
+    def _postprocess(heatmaps, rev_trans):
+        """Take the peak location of every heatmap and map it through `rev_trans`."""
+        peaks = [extract_keypoints(heatmap)[1] for heatmap in heatmaps]
+        return [affine_transform([peak[0], peak[1]], rev_trans) for peak in peaks]
+
+    def estimate(self, img, bbox):
+        """Return one transformed point per heatmap for the box `bbox` of the frame `img`."""
+        rev_trans, preprocessed_img = self._preprocess(img, bbox)
+        return self._postprocess(self._infer(preprocessed_img), rev_trans)
diff --git a/demos/python_demos/single_human_pose_estimation_demo/models.lst b/demos/python_demos/single_human_pose_estimation_demo/models.lst
new file mode 100644
index 00000000000..896e1681088
--- /dev/null
+++ b/demos/python_demos/single_human_pose_estimation_demo/models.lst
@@ -0,0 +1,11 @@
+# This file can be used with the --list option of the model downloader.
+mobilenet-ssd
+pedestrian-and-vehicle-detector-adas-????
+pedestrian-detection-adas-????
+pedestrian-detection-adas-binary-????
+person-detection-retail-0013
+person-vehicle-bike-detection-crossroad-????
+single-human-pose-estimation-????
+ssd???
+ssd_mobilenet_v?_*
+ssdlite_mobilenet_v2
diff --git a/demos/python_demos/single_human_pose_estimation_demo/single_human_pose_estimation_demo.py b/demos/python_demos/single_human_pose_estimation_demo/single_human_pose_estimation_demo.py
new file mode 100644
index 00000000000..03899cd12f9
--- /dev/null
+++ b/demos/python_demos/single_human_pose_estimation_demo/single_human_pose_estimation_demo.py
@@ -0,0 +1,107 @@
+import argparse
+import cv2
+
+from openvino.inference_engine import IECore
+
+from detector import Detector
+from estimator import HumanPoseEstimator
+
+def build_argparser():
+    """Build the argparse parser for the single human pose estimation demo."""
+    cli = argparse.ArgumentParser()
+    cli.add_argument("-m_od", "--model_od", type=str, required=True,
+                     help="path to model of object detector in xml format")
+    cli.add_argument("-m_hpe", "--model_hpe", type=str, required=True,
+                     help="path to model of human pose estimator in xml format")
+    # An omitted --input leaves the '' default in place; run_demo() rejects that value.
+    cli.add_argument("-i", "--input", type=str, nargs='+', default='', help="path to video or image/images")
+    cli.add_argument("-d", "--device", type=str, default='CPU', required=False,
+                     help="Specify the target to infer on CPU or GPU")
+    cli.add_argument("--person_label", type=int, required=False, default=15,
+                     help="Label of class person for detector")
+    cli.add_argument("--no_show", help='Optional. Do not display output.', action='store_true')
+    return cli
+
+class ImageReader(object):  # iterator that decodes the given image files one by one
+    def __init__(self, file_names):
+        self.file_names = file_names
+        self.max_idx = len(file_names)
+
+    def __iter__(self):
+        self.idx = 0  # restart from the first file on every new iteration
+        return self
+
+    def __next__(self):
+        if self.idx == self.max_idx:
+            raise StopIteration
+        img = cv2.imread(self.file_names[self.idx], cv2.IMREAD_COLOR)
+        if img is None or img.size == 0:  # cv2.imread reports a failed read by returning None
+            raise IOError('Image {} cannot be read'.format(self.file_names[self.idx]))
+        self.idx += 1
+        return img
+
+
+class VideoReader(object):  # iterator over the frames of the first entry of `file_name`
+    def __init__(self, file_name):
+        try:
+            self.file_name = int(file_name[0])  # a numeric string is passed to OpenCV as an int
+        except (TypeError, ValueError):  # not a number: keep it as given (a path)
+            self.file_name = file_name[0]
+
+    def __iter__(self):
+        self.cap = cv2.VideoCapture(self.file_name)
+        if not self.cap.isOpened():
+            raise IOError('Video {} cannot be opened'.format(self.file_name))
+        return self
+
+    def __next__(self):
+        was_read, img = self.cap.read()
+        if not was_read:
+            self.cap.release()  # free the file/device once no more frames can be read
+            raise StopIteration
+        return img
+
+
+def run_demo(args):
+    """Detect people in every input frame, estimate a pose per box and draw the results."""
+    ie = IECore()
+    detector_person = Detector(ie, path_to_model_xml=args.model_od,
+                               device=args.device, label_class=args.person_label)
+    single_human_pose_estimator = HumanPoseEstimator(ie, path_to_model_xml=args.model_hpe,
+                                                     device=args.device)
+
+    if args.input == '':
+        raise ValueError('--input has to be set')
+    # If OpenCV cannot decode the first input as an image, the input goes to VideoReader.
+    first_as_image = cv2.imread(args.input[0], cv2.IMREAD_COLOR)
+    if first_as_image is None:
+        frames_reader, delay = VideoReader(args.input), 1
+    else:
+        frames_reader, delay = ImageReader(args.input), 0
+
+    # One colour per keypoint index: a distinct first entry, then two colours alternating.
+    colors = [(0, 0, 255)] + [(255, 0, 0), (0, 255, 0)] * 8
+
+    for frame in frames_reader:
+        bboxes = detector_person.detect(frame)
+        human_poses = [single_human_pose_estimator.estimate(frame, bbox) for bbox in bboxes]
+
+        for pose, bbox in zip(human_poses, bboxes):
+            top_left, bottom_right = (bbox[0], bbox[1]), (bbox[0] + bbox[2], bbox[1] + bbox[3])
+            cv2.rectangle(frame, top_left, bottom_right, (255, 0, 0), 2)
+            for id_kpt, kpt in enumerate(pose):
+                cv2.circle(frame, (int(kpt[0]), int(kpt[1])), 3, colors[id_kpt], -1)
+
+        det_time, pose_time = detector_person.infer_time, single_human_pose_estimator.infer_time
+        summary = 'summary: {:.1f} FPS (estimation: {:.1f} FPS / detection: {:.1f} FPS)'.format(
+            float(1 / (det_time + pose_time * len(human_poses))), float(1 / pose_time), float(1 / det_time))
+        cv2.putText(frame, summary, (5, 15), cv2.FONT_HERSHEY_COMPLEX, 0.5, (0, 0, 200))
+        if args.no_show:
+            continue
+        cv2.imshow('Human Pose Estimation Demo', frame)
+        if cv2.waitKey(delay) == 27:
+            return
+
+if __name__ == "__main__":  # script entry point: parse the command line, then run the demo
+    args = build_argparser().parse_args()
+    run_demo(args)
diff --git a/demos/python_demos/smart_library_demo/README.md b/demos/python_demos/smart_library_demo/README.md
new file mode 100644
index 00000000000..65e82c601a0
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/README.md
@@ -0,0 +1,136 @@
+# Smart Library Demo
+
+The application is a demo of an automated “smart library”.
+It involves the registration of the reader; authorization of the reader through face recognition; 
+receiving and returning books by recognizing QR codes generated for each book in the library. 
+The following pretrained models can be used:
+
+* `face-detection-retail-0004`, to detect faces and predict their bounding boxes;
+* `landmarks-regression-retail-0009`, to predict face keypoints;
+* `face-reidentification-retail-0095`, to recognize readers.
+
+For more information about the pre-trained models, refer to the [model documentation](../../../models/intel/index.md).
+
+### How it works
+
+The application is started from command line.
+It reads video stream frame-by-frame from a web-camera device and performs independent analysis
+of each frame. To make predictions the application uses 3 models. An input frame is processed by
+the face detection model to detect bounding boxes. Then face keypoints
+are predicted by the facial landmarks regression model. Keypoints are used
+to align the face and match it with the faces in the database.
+To register in the library, press `r` on the keyboard. Once a reader has been registered, they are authorized
+through face recognition. A registered reader can borrow and return books by showing the QR code generated for
+each book. To recognize a book, press `b` on the keyboard. The application also prints some
+extra statistics to the console: the list of registered readers, the full list of books in the library,
+and the history of borrowed books. To switch between these listings, press `f` on the keyboard. To exit, press `q`.
+
+### Installation and dependencies
+
+The demo depends on:
+- OpenVINO toolkit (2019R3 or newer)
+- Python 3.4+ (a version supported by OpenVINO; the scripts use Python 3-only features such as `open(..., encoding=...)` and `abc.ABC`)
+- OpenCV (>=3.4.0)
+
+To install all the required Python modules you can use:
+``` sh
+pip install -r requirements.txt
+```
+
+### Creating QR-codes for books
+
+The following two files are used to create QR-codes for books:
+* `library.json` file contains information about books in the library. 
+* `createQRCodes.py` script generates QR-codes for each book in `library.json` file.
+
+``` sh
+usage: createQRCodes.py [-h] [-i LIB] [-o OUT]
+
+optional arguments:
+  -h, --help  show this help message and exit
+  -i LIB      input `.json` file with info
+  -o OUT      directory to save generated QR-codes
+```
+
+### Running the demo
+
+Running the application with the `-h` option or without
+any arguments yields the following message:
+
+``` sh
+python ./smart_library_demo.py -h
+
+usage: smart_library_demo.py [-h] -fr FREC -m_rd RDMODEL -fd FDDET -m_fd
+                             FDMODEL -lm LMDET -m_lm LMMODEL [-w_rd RDWIDTH]
+                             [-h_rd RDHEIGHT] [-t_rd RDTHRESHOLD]
+                             [-w_fd FDWIDTH] [-h_fd FDHEIGHT]
+                             [-t_fd FDTHRESHOLD] [-w_lm LMWIDTH]
+                             [-h_lm LMHEIGHT] [-br BR] [-lib LIB] [-w WEB]
+
+Smart Library Sample
+
+Optional arguments:
+  -h, --help         show this help message and exit
+  -w_rd RDWIDTH      Optional. Image width to resize
+  -h_rd RDHEIGHT     Optional. Image height to resize
+  -t_rd RDTHRESHOLD  Optional. Probability threshold for face detections.
+  -w_fd FDWIDTH      Optional. Image width to resize
+  -h_fd FDHEIGHT     Optional. Image height to resize
+  -t_fd FDTHRESHOLD  Optional. Probability threshold for face detections.
+  -w_lm LMWIDTH      Optional. Image width to resize
+  -h_lm LMHEIGHT     Optional. Image height to resize
+  -br BR             Optional. Type - QR
+  -lib LIB           Optional. Path to library.
+  -w WEB             Optional. Specify index of web-camera to open. Default is
+                     0
+
+Models:
+  -fr FREC           Required. Type of recognizer. Available DNN face
+                     recognizer - DNNfr
+  -m_rd RDMODEL      Required. Path to .xml file
+  -fd FDDET          Required. Type of detector. Available DNN face detector -
+                     DNNfd
+  -m_fd FDMODEL      Required. Path to .xml file
+  -lm LMDET          Required. Type of detector. Available DNN landmarks
+                     regression - DNNlm
+  -m_lm LMMODEL      Required. Path to .xml file
+```
+
+Example of a valid command line to run the application:
+
+Linux (`sh`, `bash`, ...) (assuming OpenVINO installed in `/opt/intel/openvino`):
+
+``` sh
+# Set up the environment
+source /opt/intel/openvino/bin/setupvars.sh
+
+python ./smart_library_demo.py \
+-fr=DNNfr \
+-m_rd=<path_to_model>/face-reidentification-retail-0095.xml \
+-fd=DNNfd -m_fd=<path_to_model>/face-detection-retail-0004.xml  \
+-lm=DNNlm \
+-m_lm=<path_to_model>/landmarks-regression-retail-0009.xml
+```
+
+Windows (`cmd`, `powershell`) (assuming OpenVINO installed in `C:/Program Files (x86)/IntelSWTools/openvino/`):
+
+``` powershell
+# Set up the environment
+call "C:/Program Files (x86)/IntelSWTools/openvino/bin/setupvars.bat"
+
+python smart_library_demo.py  -fr=DNNfr -m_rd=<path_to_model>/face-reidentification-retail-0095.xml 
+                              -fd=DNNfd -m_fd=<path_to_model>/face-detection-retail-0004.xml 
+                              -lm=DNNlm -m_lm=<path_to_model>/landmarks-regression-retail-0009.xml
+```
+Notice that the custom networks should be converted to the
+Inference Engine format (`*.xml` + `*.bin`) first. To do this use the
+[Model Optimizer](https://software.intel.com/en-us/articles/OpenVINO-ModelOptimizer) tool.
+
+### Demo output
+
+The demo uses OpenCV window to display the resulting video frame and detections.
+It outputs logs to the terminal.
+
+## See also
+
+* [Using Inference Engine Demos](../../README.md)
diff --git a/demos/python_demos/smart_library_demo/createQRCodes.py b/demos/python_demos/smart_library_demo/createQRCodes.py
new file mode 100644
index 00000000000..ccbe44b67ff
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/createQRCodes.py
@@ -0,0 +1,38 @@
+import sys, os
+import argparse
+import json
+sys.path.append("src/modules")
+import QR_generator as qr
+
+
+def createArgparse():
+    parser = argparse.ArgumentParser()
+    parser.add_argument('-i', type=str, dest = 'lib',  default='library.json')
+    parser.add_argument('-o', type=str, dest = 'out',  default='qr-codes')
+    return parser.parse_args()
+
+def main():
+    args = createArgparse()
+    gen = qr.QRgenerator()
+    if (args.lib != None and  os.path.isfile(args.lib) and args.out != None ):
+        try:
+            os.mkdir(args.out)
+        except OSError:
+            print ("Creation of the directory %s failed" % args.out)
+        else:
+            print ("Successfully created the directory %s " % args.out)
+            with open(args.lib, 'r', encoding='utf-8') as lib:
+                data = json.load(lib)
+            
+            for book in data['books']:
+                strData = (str(book['id'])+ ' ' + book['title'] + ' ' + 
+                        book['author'] + ' ' + book['publisher'] + ' ' +
+                        str(book['year']))
+                qr = gen.makeQR(strData)
+                print(strData)
+                qr.save(args.out + '/' + str(book['id']) + '.png')
+    else:
+        print('File or directory not exists!')
+
+# Run the generator as a script; main() returns None, so the exit status is 0.
+if __name__ == '__main__':
+    sys.exit(main() or 0)
\ No newline at end of file
diff --git a/demos/python_demos/smart_library_demo/library.json b/demos/python_demos/smart_library_demo/library.json
new file mode 100644
index 00000000000..40a206f2c18
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/library.json
@@ -0,0 +1,19 @@
+{
+    "books": 
+    [
+        {
+            "id": 1,
+            "title": "book 1",
+            "author": "Author 1, Author 2",
+            "publisher": "pub",
+            "year": 2018
+        },
+        {
+            "id": 2,
+            "title": "book 2",
+            "author": "Author 1, Author 2",
+            "publisher": "pub",
+            "year": 2017
+        } 
+    ]
+}
\ No newline at end of file
diff --git a/demos/python_demos/smart_library_demo/models.lst b/demos/python_demos/smart_library_demo/models.lst
new file mode 100644
index 00000000000..90ff11b3642
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/models.lst
@@ -0,0 +1,5 @@
+# This file can be used with the --list option of the model downloader.
+face-detection-retail-????
+face-reidentification-retail-????
+landmarks-regression-retail-????
+
diff --git a/demos/python_demos/smart_library_demo/requirements.txt b/demos/python_demos/smart_library_demo/requirements.txt
new file mode 100644
index 00000000000..21f35ce0811
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/requirements.txt
@@ -0,0 +1,2 @@
+pyzbar>=0.1.8
+qrcode>=6.1
diff --git a/demos/python_demos/smart_library_demo/smart_library_demo.py b/demos/python_demos/smart_library_demo/smart_library_demo.py
new file mode 100644
index 00000000000..7c955fe0d3c
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/smart_library_demo.py
@@ -0,0 +1,252 @@
+import sys, os
+import argparse
+import numpy as np
+import cv2 as cv
+import json
+
+sys.path.insert(0,'src/modules')
+import face_recognizer as fr 
+import book_recognizer as br
+
+sys.path.insert(0, 'src/infrastructure')
+from DynamicDatabase import *
+
+# Sentinel user id returned by RecognizeUser when no known reader is found.
+uknownID = -1
+# NOTE(review): main() keeps its own local ``count``; this module-level value
+# does not appear to be read anywhere in this file.
+count = 0
+
+def CreateArgparse():
+    parser = argparse.ArgumentParser(description='Smart Library Sample') 
+    parser.add_argument('-fr', type = str,
+                        dest = 'fRec', required=True, 
+                        help = 'Required. \
+                        Type of recognizer. \
+                        Available DNN face recognizer - DNNfr')
+    parser.add_argument('-m_rd', type = str, 
+                        dest = 'rdModel', required=True,  
+                        help = 'Required. Path to .xml file')        
+    parser.add_argument('-fd', type = str, 
+                        dest = 'fdDet', required=True, 
+                        help = 'Required. \
+                        Type of detector. \
+                        Available DNN face detector - DNNfd')          
+    parser.add_argument('-m_fd', type = str, 
+                        dest = 'fdModel', required=True, 
+                        help = 'Required. Path to .xml file')
+    parser.add_argument('-lm', type = str, dest = 'lmDet', required=True,
+                        help = 'Required. \
+                        Type of detector. \
+                        Available DNN landmarks regression - DNNlm')
+    parser.add_argument('-m_lm', type = str, 
+                        dest = 'lmModel', required=True, 
+                        help = 'Required. \
+                        Path to .xml file')    
+    parser.add_argument('-w_rd', type = int, default = 128,
+                        dest = 'rdWidth',
+                        help = 'Optional. Image width to resize')
+    parser.add_argument('-h_rd', type = int, default = 128,
+                        dest = 'rdHeight',
+                        help = 'Optional. Image height to resize') 
+    parser.add_argument('-t_rd', type = float, default = 0.8,
+                        dest = 'rdThreshold',
+                        help = 'Optional. \
+                         Probability threshold for face detections.')
+    parser.add_argument('-w_fd', type = int, default = 300,
+                        dest = 'fdWidth',
+                        help = 'Optional. Image width to resize')
+    parser.add_argument('-h_fd', type = int, default = 300,
+                        dest = 'fdHeight',
+                        help = 'Optional. Image height to resize') 
+    parser.add_argument('-t_fd', type = float, default = 0.9,
+                        dest = 'fdThreshold',
+                        help = 'Optional. \
+                        Probability threshold for face detections.')
+    parser.add_argument('-w_lm', type = int, default = 48,
+                        dest = 'lmWidth',
+                        help = 'Optional. Image width to resize')
+    parser.add_argument('-h_lm', type = int, default = 48,
+                        dest = 'lmHeight',
+                        help = 'Optional. Image height to resize') 
+    parser.add_argument('-br', type = str,  default = 'QR',
+                        dest = 'br',
+                        help = 'Optional. Type - QR')
+    parser.add_argument('-lib', type = str, default = 'library.json',
+                        dest = 'lib',
+                        help = 'Optional. Path to library.') 
+    parser.add_argument('-w', type = int, default = 0,
+                        dest = 'web',
+                        help = 'Optional.\
+                        Specify index of web-camera to open. Default is 0')
+    args = parser.parse_args()
+    return args
+
+def CreateLibrary(libPath, DB):
+    with open(libPath, 'r', encoding='utf-8') as lib:
+        data = json.load(lib)
+    for book in data['books']:
+        DB.addBook(book['id'], book['title'],  book['author'],
+                   book['publisher'], book['year'])
+
+def PutText(img, text, pos, ix, iy, font, color, scale, thickness, rect = 1):
+
+    textSize = cv.getTextSize(text, font, scale, thickness) 
+    if rect:
+        cv.rectangle(img, pos, (textSize[0][0] + ix, 
+                pos[1] - textSize[0][1] + iy), (255, 255, 255), cv.FILLED)
+    cv.putText(img, text, (pos[0], pos[1] + iy),
+                font, scale, color, thickness)
+
+def PutInfo(img):
+    indent = 10
+    text = 'Show book'
+    PutText(img, text, (5,  img.shape[0]), 5, -5, cv.FONT_HERSHEY_SIMPLEX, 
+            (22, 163, 245), 1, 2)
+
+    text = 'Press:'
+    PutText(img, text, (5,  indent), 0, 0, cv.FONT_HERSHEY_PLAIN, 
+            (22, 163, 245), 1, 1, 0)
+    txtSize = cv.getTextSize(text, cv.FONT_HERSHEY_PLAIN, 1, 2) 
+
+    indent += txtSize[0][1] + 5
+    text = 'r - register'
+    PutText(img, text, (5,  indent), 0, 0, cv.FONT_HERSHEY_PLAIN, 
+                        (22, 163, 245), 1, 1, 0)
+    txtSize = cv.getTextSize(text, cv.FONT_HERSHEY_PLAIN , 1, 1) 
+
+    indent += txtSize[0][1] + 5
+    text = 'b - to get or ret a book'
+    txtSize = cv.getTextSize(text, cv.FONT_HERSHEY_PLAIN , 1, 1) 
+    PutText(img, text, (5,  indent), 0, 0, cv.FONT_HERSHEY_PLAIN, 
+            (22, 163, 245), 1, 1, 0)
+
+    indent += txtSize[0][1] + 5
+    text = 'f - get info' 
+    txtSize = cv.getTextSize(text, cv.FONT_HERSHEY_PLAIN , 1, 1)
+    PutText(img, text, (5,  indent), 0, 0, cv.FONT_HERSHEY_PLAIN, 
+            (22, 163, 245), 1, 1, 0)
+
+def RecognizeUser(img, faceRec):
+    faces, out = faceRec.recognize(img)
+    userID = uknownID
+    for face in faces:
+        if len(faces) > 1:
+            text = 'No more than one person at a time'
+            PutText(img, text, (0,30), 0, -5, cv.FONT_HERSHEY_SIMPLEX, 
+                                           (22, 163, 245), 1, 2)
+
+        if np.amax(out) > faceRec.threshold:
+            userID = int(np.argmax(out) + 1)
+            text = 'User #' + str(userID)
+            PutText(img, text, face[0], face[0][0], -5, cv.FONT_HERSHEY_SIMPLEX, 
+                                           (22, 163, 245), 1, 2)
+        else:
+            text = 'Unknown'
+            PutText(img, text, face[0], face[0][0], -5, cv.FONT_HERSHEY_SIMPLEX, 
+                                           (22, 163, 245), 1, 2)     
+        cv.rectangle(img, face[0], face[1], (22, 163, 245), 2)
+    return userID
+
+def PrintInfo(count, DB):
+    os.system('cls')
+    if count == 0:
+        DB.printUsers()
+    elif count == 1:
+        DB.printBooks()
+    elif count == 2:
+        DB.printBBooks()
+
+def RecognizeBook(img, bookRec):
+    data = bookRec.recognize(img)
+    try: 
+        bID = int(data.split(' ')[0])
+        print(bID)
+        return bID 
+    except ValueError:
+        return -1
+
+def main():
+    args = CreateArgparse()
+    brArgs = dict(name='')
+    rdArgs = dict(name = '', rdXML = '', rdWidth= 0, rdHeight= 0, 
+                  rdThreshold= 0, fdName = '', fdXML = '', fdWidth = 0,
+                  fdThreshold= 0, lmName = '', lmXML= 0, 
+                  lmWidth= 0, lmHeight= 0)
+
+    DB = DynamicDB()
+    if (args.fRec != None and args.fdDet != None and args.lmDet != None):
+        rdArgs['name'] = args.fRec
+        print(args)
+        if (args.rdModel != None):
+            rdArgs['rdXML'] = args.rdModel
+        if (args.rdWidth != None):
+            rdArgs['rdWidth'] = args.rdWidth
+        if (args.rdHeight != None):
+            rdArgs['rdHeight'] = args.rdHeight
+        if (args.rdThreshold != None):
+            rdArgs['rdThreshold'] = args.rdThreshold
+
+        rdArgs['fdName'] = args.fdDet
+        if (args.fdModel != None):
+            rdArgs['fdXML'] = args.fdModel
+        if (args.fdWidth != None):
+            rdArgs['fdWidth'] = args.fdWidth
+        if (args.fdHeight != None):
+            rdArgs['fdHeight'] = args.fdHeight
+        if (args.fdThreshold != None):
+            rdArgs['fdThreshold'] = args.fdThreshold
+
+        rdArgs['lmName'] = args.lmDet
+        if (args.lmModel != None):
+            rdArgs['lmXML'] = args.lmModel
+        if (args.lmWidth != None):
+            rdArgs['lmWidth'] = args.lmWidth
+        if (args.lmWidth != None):
+            rdArgs['lmHeight'] = args.lmHeight
+        if (args.br != None): 
+            brArgs['name'] = args.br
+        if (args.br != None): 
+            lib = args.lib
+        if (args.web != None): 
+            src = args.web
+        
+        CreateLibrary(lib, DB)
+        bookRec = br.BookRecognizer.create(brArgs)
+        faceRec = fr.FaceRecognizer.create(rdArgs)
+        cap = cv.VideoCapture(src)
+        count = 0
+        while(True):
+            _, img = cap.read()
+            ch = cv.waitKey(5) & 0xFF
+            userID = RecognizeUser(img, faceRec)   
+    
+            if userID != uknownID:
+                PutInfo(img)
+                if ch == ord('b'):
+                    bookID = RecognizeBook(img, bookRec)
+                    os.system('cls')
+                    print(bookID)
+                    DB.getRetBook(userID, bookID)
+                    DB.printBBooks()
+                
+            elif ch  == ord('r'):
+                n = faceRec.register(img)
+                DB.addUser(n)
+                text = 'You are user #' +  str(n)
+                PutText(img, text, (5,  25), 5, -5, cv.FONT_HERSHEY_SIMPLEX, 
+                                            (22, 163, 245), 1, 2)
+                os.system('cls')
+                DB.printUsers()
+                cv.imshow('window',  img)
+                cv.waitKey(1000)
+            
+            cv.imshow('window',  img)
+            if ch == ord('f'):
+                count = count + 1 
+                PrintInfo(count % 3, DB)
+
+            if ch == ord('q'):
+                break
+
+        cap.release()
+        
+# Script entry point; a falsy return value of main() becomes exit status 0.
+if __name__ == '__main__':
+    sys.exit(main() or 0)
diff --git a/demos/python_demos/smart_library_demo/src/__init__.py b/demos/python_demos/smart_library_demo/src/__init__.py
new file mode 100644
index 00000000000..e69de29bb2d
diff --git a/demos/python_demos/smart_library_demo/src/infrastructure/DynamicDatabase.py b/demos/python_demos/smart_library_demo/src/infrastructure/DynamicDatabase.py
new file mode 100644
index 00000000000..df6d3798007
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/src/infrastructure/DynamicDatabase.py
@@ -0,0 +1,114 @@
+from datetime import datetime, date, time
+from Entities.User import *
+from Entities.Author import *
+from Entities.Book import *
+
+class BorrowedBooks():
+    def __init__(self, bookID, userID, borrowed, bdate, rdate):
+        self.bookID = bookID
+        self.userID = userID
+        self.borrowed = borrowed
+        self.bdate = bdate
+        self.rdate = rdate
+
+class DynamicDB():
+    
+    def __init__(self):
+        self.Users = []
+        self.Books = []
+        self.BBooks = []
+
+    def addUser(self, userID):
+        user = User(userID, '', 'User# ' +str(userID), '', '')
+        user._print()
+        self.Users.append(user)
+    
+    def deleteUser(self):
+        ''' '''
+    
+    def addBook(self, bookID, title, author,  publisher, date):
+        lAuthors = []
+        authors = author.split(', ')
+        for a in authors:
+            a = a.replace('.', '')
+            names = a.split(' ')
+            if len(names) == 3:
+                lAuthors.append(Author(-1, names[0], names[2], names[1]))
+            elif len(names) == 2:
+                lAuthors.append(Author(-1, names[0], names[1], ''))
+            else:
+                Exception('Book`s authors not in correct format')
+
+        book = Book(bookID, '', title, date, publisher, lAuthors)
+        self.Books.append(book)
+    
+    def deleteBook(self):
+        ''' '''    
+     
+    def getRetBook(self, userID, bookID):
+        dateNow = str(datetime.now()).split(' ')[0]
+        find = False
+        isBorrowed = False
+
+        for book in self.BBooks:
+            if book.bookID ==  bookID:
+                if book.borrowed:
+                    find = True
+                    isBorrowed = book.borrowed
+                    if userID == book.userID:
+                        book.borrowed = not book.borrowed
+                        book.rdate = dateNow
+                        print('Book returned succesfully')
+                    else:
+                        print('This book is not on your account')
+
+        if not find and not isBorrowed:
+            for book in self.Books: 
+                if book.book_id ==  bookID:
+                        bbook = BorrowedBooks(bookID, userID, True, dateNow, '' )
+                        find = True
+                        self.BBooks.append(bbook)
+                        print("len =", len(self.BBooks))
+                        print('Book borrowed succesfully')
+        if not find:
+           print('There is no such book')
+            
+        return find
+           
+    def printUsers(self):
+        print('{:<10}{:<10}'.format('ID', 'Name'))
+        for user in self.Users:
+            print('{:<10}{:<10}'.format(user.user_id, user.first_name))
+
+
+    def printBooks(self):
+        authorsStr = ''
+        print('{:<10}{:<30}{:<40}{:<10}{:<20}'.format('ID', 'Author','Title',
+        'Publisher', 'Publication date'))
+        for book in self.Books:
+            authorsStr = ''
+            for a in book.authors:
+                if(a.middle_name != ''):
+                    authorsStr += (a.first_name[0] + '. ' +
+                                a.middle_name[0] + '. ' 
+                                + a.last_name)
+                else:
+                    authorsStr += (a.first_name[0] + '. ' + 
+                                   a.last_name)
+                if (a != book.authors[-1]):
+                    authorsStr += ', '
+
+            print('{:<10}{:<30}{:<40}{:<10}{:<20}'.format(book.book_id, authorsStr,
+                book.title, book.publisher, book.year))
+
+    def printBBooks(self):
+        print('{:<10}{:<10}{:<20}{:<40}{:<20}{:<20}'.format('User ID', 'Book ID', 'First name',
+             'Title',  'Borrow date','Return date'))
+        for bbook in self.BBooks:
+            for book in self.Books:
+                for user in self.Users:
+                    if bbook.userID == user.user_id and bbook.bookID == book.book_id:
+                        print('{:<10}{:<10}{:<20}{:<40}{:<20}{:<20}'.format(user.user_id, book.book_id,
+                                   user.first_name, book.title, bbook.bdate, bbook.rdate))
+                        
+ 
\ No newline at end of file
diff --git a/demos/python_demos/smart_library_demo/src/infrastructure/Entities/Author.py b/demos/python_demos/smart_library_demo/src/infrastructure/Entities/Author.py
new file mode 100644
index 00000000000..eed4b586ee1
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/src/infrastructure/Entities/Author.py
@@ -0,0 +1,12 @@
+class Author:
+    def __init__(self, author_id, first_name, last_name, middle_name):
+        self.author_id = author_id
+        self.first_name = first_name
+        self.last_name = last_name
+        self.middle_name = middle_name
+        
+    def _print(self):
+        print(self.author_id)
+        print(self.first_name)
+        print(self.last_name)
+        print(self.middle_name)
\ No newline at end of file
diff --git a/demos/python_demos/smart_library_demo/src/infrastructure/Entities/Book.py b/demos/python_demos/smart_library_demo/src/infrastructure/Entities/Book.py
new file mode 100644
index 00000000000..e8fe95c598c
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/src/infrastructure/Entities/Book.py
@@ -0,0 +1,20 @@
+class Book:
+    def __init__(self, book_id, file_path, title, year, publisher, authors):
+        self.book_id = book_id
+        self.file_path = file_path
+        self.title = title
+        self.year = year
+        self.publisher = publisher
+        self.authors = authors
+        
+    def _print(self):
+        print(self.book_id)
+        print(self.file_path)
+        print(self.title)
+        print(self.year)
+        print(self.publisher)
+        print("AUTHORS:")
+        i = 0
+        for elem in self.authors:
+            (self.authors[i])._print()
+            i = i + 1
\ No newline at end of file
diff --git a/demos/python_demos/smart_library_demo/src/infrastructure/Entities/User.py b/demos/python_demos/smart_library_demo/src/infrastructure/Entities/User.py
new file mode 100644
index 00000000000..39c24b31d32
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/src/infrastructure/Entities/User.py
@@ -0,0 +1,15 @@
+class User:
+    def __init__(self, user_id, phone, first_name, last_name,
+                 middle_name = None):
+        self.user_id = user_id
+        self.phone = phone
+        self.first_name = first_name
+        self.last_name = last_name
+        self.middle_name = middle_name
+        
+    def _print(self):
+        print(self.user_id)
+        print(self.phone)
+        print(self.first_name)
+        print(self.last_name)
+        print(self.middle_name)
\ No newline at end of file
diff --git a/demos/python_demos/smart_library_demo/src/infrastructure/Entities/__init__.py b/demos/python_demos/smart_library_demo/src/infrastructure/Entities/__init__.py
new file mode 100644
index 00000000000..e69de29bb2d
diff --git a/demos/python_demos/smart_library_demo/src/infrastructure/__init__.py b/demos/python_demos/smart_library_demo/src/infrastructure/__init__.py
new file mode 100644
index 00000000000..e69de29bb2d
diff --git a/demos/python_demos/smart_library_demo/src/modules/QR_generator.py b/demos/python_demos/smart_library_demo/src/modules/QR_generator.py
new file mode 100644
index 00000000000..d6abef91557
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/src/modules/QR_generator.py
@@ -0,0 +1,25 @@
+import qrcode
+
+
+class QRgenerator(object):
+
+    # Constructor
+    def __init__(self):
+        self.generator = qrcode.QRCode(
+        error_correction=qrcode.constants.ERROR_CORRECT_M)
+
+    # Creating Qr-code
+    def makeQR(self, data):
+        """Add data to this QR Code."""
+        self.generator.data_list.clear()
+        self.generator.add_data(data)
+        """
+        Compile the data into a QR Code array.
+        :param fit: If ``True`` (or if a size has not been provided), find the
+            best fit for the data to avoid data overflow errors.
+        """
+        self.generator.make(fit=True)
+        """ Make an image from the QR Code data."""
+        image = self.generator.make_image(fill_color="black", back_color="white")
+
+        return image
diff --git a/demos/python_demos/smart_library_demo/src/modules/__init__.py b/demos/python_demos/smart_library_demo/src/modules/__init__.py
new file mode 100644
index 00000000000..e69de29bb2d
diff --git a/demos/python_demos/smart_library_demo/src/modules/book_recognizer.py b/demos/python_demos/smart_library_demo/src/modules/book_recognizer.py
new file mode 100644
index 00000000000..f67faf06f65
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/src/modules/book_recognizer.py
@@ -0,0 +1,33 @@
+import cv2
+import pyzbar.pyzbar as pyzbar
+import numpy as np
+from abc import ABC, abstractmethod
+
+class BookRecognizer(ABC):
+    @staticmethod
+    def create(args):
+        if args['name'] == 'QR':
+            return QRBookRecognizer()
+        
+    @abstractmethod
+    def recognize(self, frame):
+        """Recognize book"""
+        
+class QRBookRecognizer(BookRecognizer):
+    # Constructor
+    def __init__(self):
+        self.objects = []
+
+    def recognize(self, frame):
+        # Find barcodes and QR codes
+        gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
+        self.objects = pyzbar.decode(gray)
+
+        # Analise results
+        ans = ""
+        for obj in self.objects:
+            if obj.type == 'QRCODE':
+                ans = obj.data.decode('utf-8')
+
+        # Return decode information
+        return ans
\ No newline at end of file
diff --git a/demos/python_demos/smart_library_demo/src/modules/face_recognizer.py b/demos/python_demos/smart_library_demo/src/modules/face_recognizer.py
new file mode 100644
index 00000000000..22972043cc6
--- /dev/null
+++ b/demos/python_demos/smart_library_demo/src/modules/face_recognizer.py
@@ -0,0 +1,207 @@
+import sys, os
+import numpy as np
+import cv2 as cv
+
+from abc import ABC, abstractmethod
+
+refLandmarks = np.float32([[0.31556875000000000, 0.4615741071428571],  # left eye; rows are (x, y) fractions of image width/height
+                           [0.68262291666666670, 0.4615741071428571],  # right eye
+                           [0.50026249999999990, 0.6405053571428571],  # tip of nose
+                           [0.34947187500000004, 0.8246919642857142],  # left lip corner
+                           [0.65343645833333330, 0.8246919642857142]]) # right lip corner
+
+class FaceRecognizer(ABC):
+    """Interface of a face recognizer plus a factory that selects one by name."""
+    @staticmethod
+    def create(args):
+        """Build the recognizer named by args['name']; only 'DNNfr' is known."""
+        if args['name'] != 'DNNfr':
+            raise Exception('Error: wrong recognizer name')
+        rec_cfg = (args['rdXML'], args['rdWidth'], args['rdHeight'], args['rdThreshold'])
+        det_cfg = (args['fdName'], args['fdXML'],
+                   args['fdWidth'], args['fdHeight'], args['fdThreshold'])
+        lm_cfg = (args['lmName'], args['lmXML'], args['lmWidth'], args['lmHeight'])
+        return DNNRecognizer(*rec_cfg, *det_cfg, *lm_cfg)
+
+    @abstractmethod
+    def register(self, img, ID):
+        """Register a new reader from ``img``."""
+
+    @abstractmethod
+    def recognize(self, img):
+        """Recognize a valid user in ``img``."""
+
+class FaceDetector(ABC):
+    @staticmethod
+    def create(args):
+        """Build the detector named by args['name']; only 'DNNfd' is known."""
+        if args['name'] != 'DNNfd':
+            raise Exception('Error: wrong detector name')
+        params = [args[key] for key in ('modelXML', 'width', 'height', 'threshold')]
+        return DNNDetector(*params)
+
+    @abstractmethod
+    def detect(self, img,  threshold):
+        """Detect faces on the image."""
+
+class FaceLandmarks(ABC):
+    @staticmethod
+    def create(args):
+        """Build the landmarks model named by args['name']; only 'DNNlm' is known."""
+        if args['name'] != 'DNNlm':
+            raise Exception('Error: wrong detector name')
+        model_xml, in_width, in_height = args['modelXML'], args['width'], args['height']
+        return DNNLandmarks(model_xml, in_width, in_height)
+
+    @abstractmethod
+    def align(self, img, l):
+        """Align the face image ``img`` (``l`` is presumably the landmarks; confirm)."""
+
+class DNNLandmarks(FaceLandmarks):
+    """Facial landmarks network run through cv.dnn, plus landmark-based face alignment."""
+
+    def __init__(self, modelXML, width, height):
+        self.modelXML = modelXML
+        self.modelBIN = os.path.splitext(self.modelXML)[0] + '.bin'
+        self.width = width
+        self.height = height
+        self.net = cv.dnn.readNet(self.modelBIN, self.modelXML)
+        self.net.setPreferableBackend(cv.dnn.DNN_BACKEND_INFERENCE_ENGINE)
+        self.net.setPreferableTarget(cv.dnn.DNN_TARGET_CPU)
+
+    def findLandmarks(self, img):
+        """Return a (5, 2) float32 array of the first ten network outputs (zeros on any error)."""
+        try:
+            blob = cv.dnn.blobFromImage(img,  size=(self.width, self.height))
+            self.net.setInput(blob)
+            out = self.net.forward().flatten()
+            return out[:10].reshape(5, 2).astype(np.float32)
+        except Exception as e:
+            print('exception: ' + str(e))
+            return np.zeros((5, 2), dtype=np.float32)
+
+    def getTransform(self, src, dst):
+        """Build the 2x3 matrix that ``align`` passes to cv.warpAffine.
+
+        NOTE: ``src`` and ``dst`` are centered and rescaled in place.
+        """
+        col_mean_src = cv.reduce(src, 0, cv.REDUCE_AVG)
+        src -= col_mean_src[0]
+        col_mean_dst = cv.reduce(dst, 0, cv.REDUCE_AVG)
+        dst -= col_mean_dst[0]
+
+        # Divide each point set by its std dev; epsilon guards against zero.
+        mean, dev_src = cv.meanStdDev(src)
+        dev_src[0,0] = max(sys.float_info.epsilon, dev_src[0])
+        src /= dev_src[0,0]
+        mean, dev_dst = cv.meanStdDev(dst)
+        dev_dst[0,0] = max(sys.float_info.epsilon, dev_dst[0])
+        dst /= dev_dst[0,0]
+
+        w, u, vt = cv.SVDecomp(np.dot(cv.transpose(src), dst))
+        r = cv.transpose(np.dot(u,vt))
+        m = np.empty((2, 3), dtype=np.float32)
+        # Left 2x2 block: r times the std-dev ratio; last column: the offset.
+        m[0:2,0:2] = np.dot(r , (dev_dst[0,0] / dev_src[0,0]))
+        m[0:2,2:3] = cv.transpose(col_mean_dst) - np.dot(m[0:2,0:2],
+                                                   cv.transpose(col_mean_src))
+        return m
+
+    def align(self, img, landmarks, refLandmarks):
+        """Return ``img`` warped by the transform from ``landmarks`` to ``refLandmarks``."""
+        aligned_face = np.copy(img)
+        refLandmarksCopy = np.copy(refLandmarks)
+        # Scale both point sets by the image size and truncate; ``landmarks`` is changed in place.
+        for point, refPoint in zip(landmarks, refLandmarksCopy):
+            point[1] = int(point[1]*img.shape[0])
+            point[0] = int(point[0]*img.shape[1])
+            refPoint[1] = int(refPoint[1]*img.shape[0])
+            refPoint[0] = int(refPoint[0]*img.shape[1])
+        m = self.getTransform(landmarks, refLandmarksCopy)
+        aligned_face = cv.warpAffine(aligned_face, m,
+                            (aligned_face.shape[1], aligned_face.shape[0]))
+        return aligned_face
+       
+class DNNDetector(FaceDetector):
+    """Face detector that runs a detection network through cv.dnn."""
+    def __init__(self, modelXML, width, height, threshold):
+        self.modelXML = modelXML
+        self.modelBIN = os.path.splitext(self.modelXML)[0] + '.bin'
+        self.width, self.height = width, height
+        self.threshold = threshold
+        backendId, targetId = cv.dnn.DNN_BACKEND_INFERENCE_ENGINE, cv.dnn.DNN_TARGET_CPU
+        self.net = cv.dnn.readNet(self.modelBIN, self.modelXML)
+        self.net.setPreferableBackend(backendId)
+        self.net.setPreferableTarget(targetId)
+
+    def detect(self, img):
+        """Return ((xmin, ymin), (xmax, ymax)) pixel boxes scoring above ``self.threshold``.
+
+        Every 7-value output row holds the confidence at index 2 and box corners
+        at indices 3..6, which are multiplied by the image width/height;
+        negative pixel coordinates are replaced by 0.
+        """
+        self.net.setInput(cv.dnn.blobFromImage(img,  size=(self.width, self.height)))
+        faces = []
+        for detection in self.net.forward().reshape(-1, 7):
+            if float(detection[2]) > self.threshold:
+                xmin, xmax = (max(0, int(detection[k] * img.shape[1])) for k in (3, 5))
+                ymin, ymax = (max(0, int(detection[k] * img.shape[0])) for k in (4, 6))
+                faces.append(((xmin, ymin), (xmax, ymax)))
+        return faces
+
+class DNNRecognizer(FaceRecognizer):
+    """Face recognizer chaining a face detector, a landmarks model and a recognition network."""
+    def __init__(self, recXML, recWidth, recHeight, recThreshold,
+                  detName, detXML, detWidth, detHeight, detThreshold,
+                  lmarksName, lmarksXML, lmarksWidth, lmarksHeight):
+        args = dict(name = lmarksName, modelXML = lmarksXML,
+                    width = lmarksWidth, height = lmarksHeight)
+        self.fl = FaceLandmarks.create(args)
+        args = dict(name = detName, modelXML = detXML,
+                    width = detWidth, height = detHeight, threshold = detThreshold)
+        self.det = FaceDetector.create(args)
+        self.bd = np.empty((0, 256), dtype=np.float32)
+        self.counter = 0
+        self.modelXML = recXML
+        self.modelBIN = os.path.splitext(self.modelXML)[0] + '.bin'
+        self.width, self.height = recWidth, recHeight
+        self.threshold = recThreshold
+        self.net = cv.dnn.readNet(self.modelBIN, self.modelXML)
+        self.net.setPreferableBackend(cv.dnn.DNN_BACKEND_INFERENCE_ENGINE)
+        self.net.setPreferableTarget(cv.dnn.DNN_TARGET_CPU)
+
+    def similarity(self, fVec, refVecs):
+        """Return cosine similarities of ``fVec`` to the rows of ``refVecs`` (zeros((1, 1)) if either is empty)."""
+        refVecs = refVecs.T
+        if not (fVec.size and refVecs.size):
+            return np.zeros((1, 1))
+        return np.dot(fVec, refVecs)/(np.linalg.norm(fVec)*np.linalg.norm(refVecs, axis=0))
+
+    def getFeatures(self, img):
+        """Return ``(faces, featureVec)``; the vector is empty unless exactly one face is detected."""
+        faces = self.det.detect(img)
+        if len(faces) != 1:
+            return (faces, np.empty(0))
+        (xmin, ymin), (xmax, ymax) = faces[0]
+        roi = img[ymin:ymax, xmin:xmax]
+        landmarks = self.fl.findLandmarks(roi)
+        alignFace = self.fl.align(roi, landmarks, refLandmarks)
+        blob = cv.dnn.blobFromImage(alignFace,  size=(self.width, self.height))
+        self.net.setInput(blob)
+        return (faces, self.net.forward().flatten())
+
+    def recognize(self, img):
+        """Return ``(faces, similarities)`` for ``img`` against all registered vectors."""
+        faces, fVec = self.getFeatures(img)
+        return (faces, self.similarity(fVec, self.bd))
+
+    def register(self, img, ID = 0):
+        """Store the feature vector of the single face in ``img``; return the number stored."""
+        _, vec = self.getFeatures(img)
+        if not vec.size:
+            # Without this check np.append fails with an opaque shape-mismatch ValueError.
+            raise ValueError('Error: exactly one face must be detected to register')
+        self.bd = np.append(self.bd, [vec], axis=0)
+        self.counter = self.bd.shape[0]
+        return self.counter
diff --git a/demos/python_demos/text_spotting_demo/README.md b/demos/python_demos/text_spotting_demo/README.md
new file mode 100644
index 00000000000..0f49028b4ce
--- /dev/null
+++ b/demos/python_demos/text_spotting_demo/README.md
@@ -0,0 +1,132 @@
+# Text Spotting Python* Demo
+
+This demo shows how to run Text Spotting models. Text Spotting models allow us to simultaneously detect and recognize text.
+
+> **NOTE**: Only batch size of 1 is supported.
+
+## How It Works
+
+The demo application expects a text spotting model that is split into three parts. Every model part must be in the Intermediate Representation (IR) format.
+
+The first model is a Mask-RCNN-like text detector with the following constraints:
+
+* Two inputs: `im_data` for input image and `im_info` for meta-information about the image (actual height, width and scale).
+* At least five outputs including:
+    * `boxes` with absolute bounding box coordinates of the input image
+    * `scores` with confidence scores for all bounding boxes
+    * `classes` with object class IDs for all bounding boxes
+    * `raw_masks` with fixed-size segmentation heat maps for all classes of all bounding boxes
+    * `text_features` with text features which are fed to Text Recognition Head further
+
+The second model is a Text Recognition Encoder that takes `text_features` as input and produces `encoded text`.
+
+The third model is a Text Recognition Decoder that takes `encoded text` from the Text Recognition Encoder, `previous symbol`, and `hidden state` as inputs. On the first step, a special `Start Of Sequence (SOS)` symbol and a zero `hidden state` are fed to the Text Recognition Decoder. The decoder produces `symbols distribution` and `current hidden state` at each step until the `End Of Sequence (EOS)` symbol is generated.
+
+As input, the demo application takes a path to a single image file, a video file or a numeric ID of a web camera specified with a command-line argument `-i`.
+
+The demo workflow is the following:
+
+1. The demo application reads image/video frames one by one, resizes them to fit into the input image blob of the network (`im_data`).
+2. The `im_info` input blob passes resulting resolution and scale of a pre-processed image to the network to perform inference of Mask-RCNN-like text detector.
+3. The Text Recognition Encoder takes input from the text detector and produces output.
+4. The Text Recognition Decoder takes the output of the Text Recognition Encoder as input and produces output.
+5. The demo visualizes the text spotting results. Certain command-line options affect the visualization:
+    * If you specify `--show_boxes` and `--show_scores` arguments, bounding boxes and confidence scores are also shown.
+    * By default, tracking is used to show each text instance with the same color throughout the whole video.
+      It assumes more or less static scene with instances in two frames being a part of the same track if intersection over union of the masks is greater than the 0.5 threshold. To disable tracking, specify the `--no_track` argument.
+
+> **NOTE**: By default, Open Model Zoo demos expect input with BGR channels order. If you trained your model to work with RGB order, you need to manually rearrange the default channels order in the demo application or reconvert your model using the Model Optimizer tool with `--reverse_input_channels` argument specified. For more information about the argument, refer to **When to Reverse Input Channels** section of [Converting a Model Using General Conversion Parameters](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_convert_model_Converting_Model_General.html).
+
+## Running
+
+Run the application with the `-h` option to see the following usage message:
+
+```
+usage: text_spotting_demo.py [-h] -m_m "<path>" -m_te "<path>" -m_td "<path>" -i
+                             "<path>" [-d "<device>"] [-l "<absolute_path>"]
+                             [--delay "<num>"] [-pt "<num>"] [-a ALPHABET]
+                             [--trd_input_prev_symbol TRD_INPUT_PREV_SYMBOL]
+                             [--trd_input_prev_hidden TRD_INPUT_PREV_HIDDEN]
+                             [--trd_input_encoder_outputs TRD_INPUT_ENCODER_OUTPUTS]
+                             [--trd_output_symbols_distr TRD_OUTPUT_SYMBOLS_DISTR]
+                             [--trd_output_cur_hidden TRD_OUTPUT_CUR_HIDDEN]
+                             [--keep_aspect_ratio] [--no_track]
+                             [--show_scores] [--show_boxes] [-pc] [-r]
+                             [--no_show]
+
+Options:
+  -h, --help            Show this help message and exit.
+  -m_m "<path>", --mask_rcnn_model "<path>"
+                        Required. Path to an .xml file with a trained Mask-
+                        RCNN model with additional text features output.
+  -m_te "<path>", --text_enc_model "<path>"
+                        Required. Path to an .xml file with a trained text
+                        recognition model (encoder part).
+  -m_td "<path>", --text_dec_model "<path>"
+                        Required. Path to an .xml file with a trained text
+                        recognition model (decoder part).
+  -i "<path>"           Required. Path to an image, video file or a numeric
+                        camera ID.
+  -d "<device>", --device "<device>"
+                        Optional. Specify the target device to infer on: CPU,
+                        GPU, FPGA, HDDL or MYRIAD. The demo will look for a
+                        suitable plugin for device specified (by default, it
+                        is CPU).
+  -l "<absolute_path>", --cpu_extension "<absolute_path>"
+                        Required for CPU custom layers. Absolute path to a
+                        shared library with the kernels implementation.
+  --delay "<num>"       Optional. Interval in milliseconds of waiting for a
+                        key to be pressed.
+  -pt "<num>", --prob_threshold "<num>"
+                        Optional. Probability threshold for detections
+                        filtering.
+  -a ALPHABET, --alphabet ALPHABET
+                        Optional. Alphabet that is used for decoding.
+  --trd_input_prev_symbol TRD_INPUT_PREV_SYMBOL
+                        Optional. Name of previous symbol input node to text
+                        recognition head decoder part.
+  --trd_input_prev_hidden TRD_INPUT_PREV_HIDDEN
+                        Optional. Name of previous hidden input node to text
+                        recognition head decoder part.
+  --trd_input_encoder_outputs TRD_INPUT_ENCODER_OUTPUTS
+                        Optional. Name of encoder outputs input node to text
+                        recognition head decoder part.
+  --trd_output_symbols_distr TRD_OUTPUT_SYMBOLS_DISTR
+                        Optional. Name of symbols distribution output node
+                        from text recognition head decoder part.
+  --trd_output_cur_hidden TRD_OUTPUT_CUR_HIDDEN
+                        Optional. Name of current hidden output node from text
+                        recognition head decoder part.
+  --keep_aspect_ratio   Optional. Force image resize to keep aspect ratio.
+  --no_track            Optional. Disable tracking.
+  --show_scores         Optional. Show detection scores.
+  --show_boxes          Optional. Show bounding boxes.
+  -pc, --perf_counts    Optional. Report performance counters.
+  -r, --raw_output_message
+                        Optional. Output inference results raw values.
+  --no_show             Optional. Don't show output
+```
+
+Running the application with an empty list of options yields the short version of the usage message and an error message.
+
+To run the demo, you can use public or pre-trained models. To download the pre-trained models, use the OpenVINO [Model Downloader](../../../tools/downloader/README.md) or go to [https://download.01.org/opencv/](https://download.01.org/opencv/).
+
+> **NOTE**: Before running the demo with a trained model, make sure the model is converted to the Inference Engine format (`*.xml` + `*.bin`) using the [Model Optimizer tool](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html).
+
+To run the demo, please provide paths to the models in the IR format and to an input video, image, or folder with images:
+```bash
+python3 text_spotting_demo.py \
+-m_m <path_to_models>/text-spotting-0001-detector.xml \
+-m_te <path_to_models>/text-spotting-0001-recognizer-encoder.xml \
+-m_td <path_to_models>/text-spotting-0001-recognizer-decoder.xml \
+-i input_image.jpg
+```
+
+## Demo Output
+
+The application uses OpenCV to display resulting text instances and current inference performance.
+
+## See Also
+* [Using Open Model Zoo demos](../../README.md)
+* [Model Optimizer](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html)
+* [Model Downloader](../../../tools/downloader/README.md)
diff --git a/demos/python_demos/text_spotting_demo/models.lst b/demos/python_demos/text_spotting_demo/models.lst
new file mode 100644
index 00000000000..6bd0dbb5f77
--- /dev/null
+++ b/demos/python_demos/text_spotting_demo/models.lst
@@ -0,0 +1,2 @@
+# This file can be used with the --list option of the model downloader.
+text-spotting-*
diff --git a/demos/python_demos/text_spotting_demo/text_spotting_demo.py b/demos/python_demos/text_spotting_demo/text_spotting_demo.py
new file mode 100644
index 00000000000..d04c1b4517b
--- /dev/null
+++ b/demos/python_demos/text_spotting_demo/text_spotting_demo.py
@@ -0,0 +1,384 @@
+#!/usr/bin/env python
+"""
+ Copyright (c) 2019 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+from __future__ import print_function
+
+import logging as log
+import os
+import sys
+import time
+from argparse import ArgumentParser, SUPPRESS
+
+import cv2
+import numpy as np
+from openvino.inference_engine import IENetwork, IECore
+
+from text_spotting_demo.tracker import StaticIOUTracker
+from text_spotting_demo.visualizer import Visualizer
+
+SOS_INDEX = 0  # symbol index fed to the decoder on its first step
+EOS_INDEX = 1  # predicted symbol index that ends decoding of a text
+MAX_SEQ_LEN = 28  # upper bound on decoder steps per text instance
+
+class FolderCapture:
+    """cv2.VideoCapture-like reader over a folder's .jpg/.png files, visited in sorted name order."""
+    def __init__(self, path):
+        self.current_index = 0
+        self.images_paths = [os.path.join(path, imname) for imname in sorted(os.listdir(path))
+                             if imname.lower().endswith(('.jpg', '.png'))]
+
+    def read(self):
+        """Return ``(True, image)`` for the next readable file, or ``(False, None)`` when exhausted."""
+        while self.current_index < len(self.images_paths):
+            image = cv2.imread(self.images_paths[self.current_index])
+            self.current_index += 1
+            if image is not None:  # skip files cv2.imread could not decode
+                return True, image
+        return False, None
+
+    def isOpened(self):
+        """Return True while the list of image paths is non-empty."""
+        return len(self.images_paths) > 0
+
+    def release(self):
+        """Drop all image paths, so isOpened() becomes False."""
+        self.images_paths = []
+
+def build_argparser():
+    """Build the command-line parser of the text spotting demo.
+
+    All options are registered in a single 'Options' group; -h/--help is
+    added explicitly because the parser is created with add_help=False.
+
+    Returns the configured ArgumentParser.
+    """
+    parser = ArgumentParser(add_help=False)
+    options = parser.add_argument_group('Options')
+    options.add_argument('-h', '--help', action='help', default=SUPPRESS,
+                         help='Show this help message and exit.')
+
+    # Required model files and input source.
+    options.add_argument('-m_m', '--mask_rcnn_model', required=True, type=str, metavar='"<path>"',
+                         help='Required. Path to an .xml file with a trained Mask-RCNN model with '
+                              'additional text features output.')
+    options.add_argument('-m_te', '--text_enc_model', required=True, type=str, metavar='"<path>"',
+                         help='Required. Path to an .xml file with a trained text recognition model '
+                              '(encoder part).')
+    options.add_argument('-m_td', '--text_dec_model', required=True, type=str, metavar='"<path>"',
+                         help='Required. Path to an .xml file with a trained text recognition model '
+                              '(decoder part).')
+    options.add_argument('-i', dest='input_source', required=True, type=str, metavar='"<path>"',
+                         help='Required. Path to an image, video file or a numeric camera ID.')
+
+    # Device selection and tuning values.
+    options.add_argument('-d', '--device', default='CPU', type=str, metavar='"<device>"',
+                         help='Optional. Specify the target device to infer on: CPU, GPU, FPGA, HDDL or MYRIAD. '
+                              'The demo will look for a suitable plugin for device specified '
+                              '(by default, it is CPU).')
+    options.add_argument('-l', '--cpu_extension', default=None, type=str, metavar='"<absolute_path>"',
+                         help='Required for CPU custom layers. '
+                              'Absolute path to a shared library with the kernels implementation.')
+    options.add_argument('--delay', default=0, type=int, metavar='"<num>"',
+                         help='Optional. Interval in milliseconds of waiting for a key to be pressed.')
+    options.add_argument('-pt', '--prob_threshold', default=0.5, type=float, metavar='"<num>"',
+                         help='Optional. Probability threshold for detections filtering.')
+    options.add_argument('-a', '--alphabet', default='  0123456789abcdefghijklmnopqrstuvwxyz',
+                         help='Optional. Alphabet that is used for decoding.')
+
+    # Node names of the text recognition decoder: (flag, help text, default).
+    decoder_nodes = (
+        ('--trd_input_prev_symbol',
+         'Optional. Name of previous symbol input node to text recognition head decoder part.',
+         'prev_symbol'),
+        ('--trd_input_prev_hidden',
+         'Optional. Name of previous hidden input node to text recognition head decoder part.',
+         'prev_hidden'),
+        ('--trd_input_encoder_outputs',
+         'Optional. Name of encoder outputs input node to text recognition head decoder part.',
+         'encoder_outputs'),
+        ('--trd_output_symbols_distr',
+         'Optional. Name of symbols distribution output node from text recognition head decoder part.',
+         'output'),
+        ('--trd_output_cur_hidden',
+         'Optional. Name of current hidden output node from text recognition head decoder part.',
+         'hidden'),
+    )
+    for flag, text, node in decoder_nodes:
+        options.add_argument(flag, help=text, default=node)
+
+    # Boolean switches: (flags, help text).
+    switches = (
+        (('--keep_aspect_ratio',), 'Optional. Force image resize to keep aspect ratio.'),
+        (('--no_track',), 'Optional. Disable tracking.'),
+        (('--show_scores',), 'Optional. Show detection scores.'),
+        (('--show_boxes',), 'Optional. Show bounding boxes.'),
+        (('-pc', '--perf_counts'), 'Optional. Report performance counters.'),
+        (('-r', '--raw_output_message'), 'Optional. Output inference results raw values.'),
+        (('--no_show',), "Optional. Don't show output"),
+    )
+    for flags, text in switches:
+        options.add_argument(*flags, help=text, action='store_true')
+
+    return parser
+
+
+def expand_box(box, scale):
+    """Scale ``box`` = (x0, y0, x1, y1) about its center by ``scale``.
+
+    Returns a new float array shaped like ``box``; ``box`` itself is not modified.
+    """
+    x_min, y_min, x_max, y_max = box[0], box[1], box[2], box[3]
+    center_x, center_y = (x_max + x_min) * .5, (y_max + y_min) * .5
+    half_w = (x_max - x_min) * .5 * scale
+    half_h = (y_max - y_min) * .5 * scale
+    expanded = np.zeros(box.shape)
+    expanded[0], expanded[1] = center_x - half_w, center_y - half_h
+    expanded[2], expanded[3] = center_x + half_w, center_y + half_h
+    return expanded
+
+
+def segm_postprocess(box, raw_cls_mask, im_h, im_w):
+    """Paste the fixed-size mask ``raw_cls_mask`` of ``box`` into a zeroed (im_h, im_w) uint8 mask."""
+    # A one-pixel zero border prevents upsampling artifacts on segment borders.
+    padded = np.pad(raw_cls_mask, ((1, 1), (1, 1)), 'constant', constant_values=0)
+    # Grow the box by the same ratio the padding grew the mask.
+    side = padded.shape[0]
+    ext = expand_box(box, side / (side - 2.0)).astype(int)
+    w, h = np.maximum(ext[2:] - ext[:2] + 1, 1)
+    x0, y0 = np.clip(ext[:2], a_min=0, a_max=[im_w, im_h])
+    x1, y1 = np.clip(ext[2:] + 1, a_min=0, a_max=[im_w, im_h])
+    # Resize to the box size and binarize at 0.5.
+    mask = (cv2.resize(padded, (w, h)) > 0.5).astype(np.uint8)
+    im_mask = np.zeros((im_h, im_w), dtype=np.uint8)
+    im_mask[y0:y1, x0:x1] = mask[(y0 - ext[1]):(y1 - ext[1]), (x0 - ext[0]):(x1 - ext[0])]
+    return im_mask
+
+
+def main():
+    log.basicConfig(format='[ %(levelname)s ] %(message)s', level=log.INFO, stream=sys.stdout)
+    args = build_argparser().parse_args()
+
+    mask_rcnn_model_xml = args.mask_rcnn_model
+    mask_rcnn_model_bin = os.path.splitext(mask_rcnn_model_xml)[0] + '.bin'
+
+    text_enc_model_xml = args.text_enc_model
+    text_enc_model_bin = os.path.splitext(text_enc_model_xml)[0] + '.bin'
+
+    text_dec_model_xml = args.text_dec_model
+    text_dec_model_bin = os.path.splitext(text_dec_model_xml)[0] + '.bin'
+
+    # Plugin initialization for specified device and load extensions library if specified.
+    log.info('Creating Inference Engine...')
+    ie = IECore()
+    if args.cpu_extension and 'CPU' in args.device:
+        ie.add_extension(args.cpu_extension, 'CPU')
+    # Read IR
+    log.info('Loading network files:\n\t{}\n\t{}'.format(mask_rcnn_model_xml, mask_rcnn_model_bin))
+    mask_rcnn_net = IENetwork(model=mask_rcnn_model_xml, weights=mask_rcnn_model_bin)
+
+    log.info('Loading network files:\n\t{}\n\t{}'.format(text_enc_model_xml, text_enc_model_bin))
+    text_enc_net = IENetwork(model=text_enc_model_xml, weights=text_enc_model_bin)
+
+    log.info('Loading network files:\n\t{}\n\t{}'.format(text_dec_model_xml, text_dec_model_bin))
+    text_dec_net = IENetwork(model=text_dec_model_xml, weights=text_dec_model_bin)
+
+    if 'CPU' in args.device:
+        supported_layers = ie.query_network(mask_rcnn_net, 'CPU')
+        not_supported_layers = [l for l in mask_rcnn_net.layers.keys() if l not in supported_layers]
+        if len(not_supported_layers) != 0:
+            log.error('Following layers are not supported by the plugin for specified device {}:\n {}'.
+                      format(args.device, ', '.join(not_supported_layers)))
+            log.error("Please try to specify cpu extensions library path in sample's command line parameters using -l "
+                      "or --cpu_extension command line argument")
+            sys.exit(1)
+
+    required_input_keys = {'im_data', 'im_info'}
+    assert required_input_keys == set(mask_rcnn_net.inputs.keys()), \
+        'Demo supports only topologies with the following input keys: {}'.format(', '.join(required_input_keys))
+    required_output_keys = {'boxes', 'scores', 'classes', 'raw_masks', 'text_features'}
+    assert required_output_keys.issubset(mask_rcnn_net.outputs.keys()), \
+        'Demo supports only topologies with the following output keys: {}'.format(', '.join(required_output_keys))
+
+    n, c, h, w = mask_rcnn_net.inputs['im_data'].shape
+    assert n == 1, 'Only batch 1 is supported by the demo application'
+
+    log.info('Loading IR to the plugin...')
+    mask_rcnn_exec_net = ie.load_network(network=mask_rcnn_net, device_name=args.device, num_requests=2)
+    text_enc_exec_net = ie.load_network(network=text_enc_net, device_name=args.device)
+    text_dec_exec_net = ie.load_network(network=text_dec_net, device_name=args.device)
+
+    hidden_shape = text_dec_net.inputs[args.trd_input_prev_hidden].shape
+
+    del mask_rcnn_net
+    del text_enc_net
+    del text_dec_net
+
+    try:
+        input_source = int(args.input_source)
+    except ValueError:
+        input_source = args.input_source
+
+    if os.path.isdir(input_source):
+        cap = FolderCapture(input_source)
+    else:
+        cap = cv2.VideoCapture(input_source)
+
+    if not cap.isOpened():
+        log.error('Failed to open "{}"'.format(args.input_source))
+    if isinstance(cap, cv2.VideoCapture):
+        cap.set(cv2.CAP_PROP_BUFFERSIZE, 1)
+
+    if args.no_track:
+        tracker = None
+    else:
+        tracker = StaticIOUTracker()
+
+    visualizer = Visualizer(['__background__', 'text'], show_boxes=args.show_boxes, show_scores=args.show_scores)
+
+    render_time = 0
+
+    log.info('Starting inference...')
+    print("To close the application, press 'CTRL+C' here or switch to the output window and press ESC key")
+    while cap.isOpened():
+        ret, frame = cap.read()
+        if not ret:
+            break
+
+        if not args.keep_aspect_ratio:
+            # Resize the image to a target size.
+            scale_x = w / frame.shape[1]
+            scale_y = h / frame.shape[0]
+            input_image = cv2.resize(frame, (w, h))
+        else:
+            # Resize the image to keep the same aspect ratio and to fit it to a window of a target size.
+            scale_x = scale_y = min(h / frame.shape[0], w / frame.shape[1])
+            input_image = cv2.resize(frame, None, fx=scale_x, fy=scale_y)
+
+        input_image_size = input_image.shape[:2]
+        input_image = np.pad(input_image, ((0, h - input_image_size[0]),
+                                           (0, w - input_image_size[1]),
+                                           (0, 0)),
+                             mode='constant', constant_values=0)
+        # Change data layout from HWC to CHW.
+        input_image = input_image.transpose((2, 0, 1))
+        input_image = input_image.reshape((n, c, h, w)).astype(np.float32)
+        input_image_info = np.asarray([[input_image_size[0], input_image_size[1], 1]], dtype=np.float32)
+
+        # Run the net.
+        inf_start = time.time()
+        outputs = mask_rcnn_exec_net.infer({'im_data': input_image, 'im_info': input_image_info})
+
+        # Parse detection results of the current request
+        boxes = outputs['boxes']
+        scores = outputs['scores']
+        classes = outputs['classes'].astype(np.uint32)
+        raw_masks = outputs['raw_masks']
+        text_features = outputs['text_features']
+
+        # Filter out detections with low confidence.
+        detections_filter = scores > args.prob_threshold
+        scores = scores[detections_filter]
+        classes = classes[detections_filter]
+        boxes = boxes[detections_filter]
+        raw_masks = raw_masks[detections_filter]
+        text_features = text_features[detections_filter]
+
+        boxes[:, 0::2] /= scale_x
+        boxes[:, 1::2] /= scale_y
+        masks = []
+        for box, cls, raw_mask in zip(boxes, classes, raw_masks):
+            raw_cls_mask = raw_mask[cls, ...]
+            mask = segm_postprocess(box, raw_cls_mask, frame.shape[0], frame.shape[1])
+            masks.append(mask)
+
+        texts = []
+        for feature in text_features:
+            feature = text_enc_exec_net.infer({'input': feature})['output']
+            feature = np.reshape(feature, (feature.shape[0], feature.shape[1], -1))
+            feature = np.transpose(feature, (0, 2, 1))
+
+            hidden = np.zeros(hidden_shape)
+            prev_symbol_index = np.ones((1,)) * SOS_INDEX
+
+            text = ''
+            for i in range(MAX_SEQ_LEN):
+                decoder_output = text_dec_exec_net.infer({
+                    args.trd_input_prev_symbol: prev_symbol_index,
+                    args.trd_input_prev_hidden: hidden,
+                    args.trd_input_encoder_outputs: feature})
+                symbols_distr = decoder_output[args.trd_output_symbols_distr]
+                prev_symbol_index = int(np.argmax(symbols_distr, axis=1))
+                if prev_symbol_index == EOS_INDEX:
+                    break
+                text += args.alphabet[prev_symbol_index]
+                hidden = decoder_output[args.trd_output_cur_hidden]
+
+            texts.append(text)
+
+        inf_end = time.time()
+        inf_time = inf_end - inf_start
+
+        render_start = time.time()
+
+        if len(boxes) and args.raw_output_message:
+            log.info('Detected boxes:')
+            log.info('  Class ID | Confidence |     XMIN |     YMIN |     XMAX |     YMAX ')
+            for box, cls, score, mask in zip(boxes, classes, scores, masks):
+                log.info('{:>10} | {:>10f} | {:>8.2f} | {:>8.2f} | {:>8.2f} | {:>8.2f} '.format(cls, score, *box))
+
+        # Get instance track IDs.
+        masks_tracks_ids = None
+        if tracker is not None:
+            masks_tracks_ids = tracker(masks, classes)
+
+        # Visualize masks.
+        frame = visualizer(frame, boxes, classes, scores, masks, texts, masks_tracks_ids)
+
+        # Draw performance stats.
+        inf_time_message = 'Inference and post-processing time: {:.3f} ms'.format(inf_time * 1000)
+        render_time_message = 'OpenCV rendering time: {:.3f} ms'.format(render_time * 1000)
+        cv2.putText(frame, inf_time_message, (15, 15), cv2.FONT_HERSHEY_COMPLEX, 0.5, (200, 10, 10), 1)
+        cv2.putText(frame, render_time_message, (15, 30), cv2.FONT_HERSHEY_COMPLEX, 0.5, (10, 10, 200), 1)
+
+        # Print performance counters.
+        if args.perf_counts:
+            perf_counts = mask_rcnn_exec_net.requests[0].get_perf_counts()
+            log.info('Performance counters:')
+            print('{:<70} {:<15} {:<15} {:<15} {:<10}'.format('name', 'layer_type', 'exet_type', 'status',
+                                                              'real_time, us'))
+            for layer, stats in perf_counts.items():
+                print('{:<70} {:<15} {:<15} {:<15} {:<10}'.format(layer, stats['layer_type'], stats['exec_type'],
+                                                                  stats['status'], stats['real_time']))
+
+        if not args.no_show:
+            # Show resulting image.
+            cv2.imshow('Results', frame)
+        render_end = time.time()
+        render_time = render_end - render_start
+
+        if not args.no_show:
+            key = cv2.waitKey(args.delay)
+            esc_code = 27
+            if key == esc_code:
+                break
+
+    cv2.destroyAllWindows()
+    cap.release()
+
+
+if __name__ == '__main__':
+    sys.exit(main() or 0)  # exit status is main()'s result, or 0 when that result is falsy (e.g. None)
diff --git a/demos/python_demos/text_spotting_demo/text_spotting_demo/__init__.py b/demos/python_demos/text_spotting_demo/text_spotting_demo/__init__.py
new file mode 100644
index 00000000000..e69de29bb2d
diff --git a/demos/python_demos/text_spotting_demo/text_spotting_demo/tracker.py b/demos/python_demos/text_spotting_demo/text_spotting_demo/tracker.py
new file mode 100644
index 00000000000..c6730c39b5c
--- /dev/null
+++ b/demos/python_demos/text_spotting_demo/text_spotting_demo/tracker.py
@@ -0,0 +1,97 @@
+"""
+ Copyright (c) 2019 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+import numpy as np
+
+
+class StaticIOUTracker(object):
+    """Greedy mask-IoU tracker that assigns persistent integer IDs to instance masks across calls."""
+    def __init__(self, iou_threshold=0.5, age_threshold=10):
+        super().__init__()
+        self.history = []  # last mask seen for each live track
+        self.history_areas = []  # non-zero pixel count of each mask in `history`
+        self.history_classes = []  # class of each track, fixed when the track is created
+        self.ids = []  # track ID of each entry
+        self.age = []  # number of calls since each track was last matched
+        self.iou_threshold = iou_threshold  # a match requires IoU strictly above this
+        self.age_threshold = age_threshold  # tracks whose age reaches this are dropped
+        self.last_id = 0  # next unused track ID
+
+    def affinity(self, masks, classes):
+        """Return the (len(masks), len(self.history)) IoU matrix and the mask areas; cross-class pairs stay 0."""
+        areas = [np.count_nonzero(mask) for mask in masks]
+        affinity_matrix = np.zeros((len(masks), len(self.history)), dtype=np.float32)
+        for i, (history_mask, history_area, history_class) in \
+                enumerate(zip(self.history, self.history_areas, self.history_classes)):
+            for j, (mask, area, cls) in enumerate(zip(masks, areas, classes)):
+                if cls != history_class:
+                    continue
+                intersection = np.count_nonzero(np.logical_and(history_mask, mask))
+                union = history_area + area - intersection
+                affinity_matrix[j, i] = intersection / union if union > 0 else 0.0  # two empty masks: no overlap
+        return affinity_matrix, areas
+
+    def __call__(self, masks, classes):
+        """Match masks to existing tracks, then update, prune and create tracks; return one track ID per mask."""
+        # Get affinity with history.
+        affinity_matrix, areas = self.affinity(masks, classes)
+
+        # Greedily assign current masks, in input order, to existing tracks (each track is used at most once).
+        assignment = []
+        indices = np.arange(len(self.history))  # maps remaining matrix columns back to track positions
+        for i in range(len(masks)):
+            j, affinity_score = 0, -1.0
+            if affinity_matrix.shape[1] > 0:
+                j = np.argmax(affinity_matrix[i])
+                affinity_score = affinity_matrix[i, j]
+            if affinity_score > self.iou_threshold:
+                assignment.append(indices[j])
+                affinity_matrix = np.delete(affinity_matrix, j, 1)  # this track is taken: drop its column
+                indices = np.delete(indices, j)
+            else:
+                assignment.append(None)
+
+        # Increase age for existing tracks.
+        self.age = [age + 1 for age in self.age]
+
+        # Update existing tracks.
+        for i, j in enumerate(assignment):
+            if j is not None:
+                self.history[j] = masks[i]
+                self.history_areas[j] = areas[i]
+                self.age[j] = 0
+                assignment[i] = self.ids[j]  # replace the track position with its public ID
+
+        # Prune out too old tracks.
+        alive = tuple(i for i, age in enumerate(self.age) if age < self.age_threshold)
+        self.history = list(self.history[i] for i in alive)
+        self.history_areas = list(self.history_areas[i] for i in alive)
+        self.history_classes = list(self.history_classes[i] for i in alive)
+        self.age = list(self.age[i] for i in alive)
+        self.ids = list(self.ids[i] for i in alive)
+
+        # Save new tracks.
+        for i, j in enumerate(assignment):
+            if j is None:
+                self.history.append(masks[i])
+                self.history_areas.append(areas[i])
+                self.history_classes.append(classes[i])
+                self.age.append(0)
+                self.ids.append(self.last_id)
+                assignment[i] = self.last_id
+                self.last_id += 1
+
+        return assignment
diff --git a/demos/python_demos/text_spotting_demo/text_spotting_demo/visualizer.py b/demos/python_demos/text_spotting_demo/text_spotting_demo/visualizer.py
new file mode 100644
index 00000000000..7dd0cab4117
--- /dev/null
+++ b/demos/python_demos/text_spotting_demo/text_spotting_demo/visualizer.py
@@ -0,0 +1,180 @@
+"""
+ Copyright (c) 2019 Intel Corporation
+
+ Licensed under the Apache License, Version 2.0 (the "License");
+ you may not use this file except in compliance with the License.
+ You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+"""
+
+from __future__ import print_function
+
+import cv2
+import numpy as np
+
+
+class Visualizer(object):  # callable that draws masks, optional boxes and text labels onto an image
+    instance_color_palette = np.array([[0, 113, 188],  # per-instance mask colors, indexed modulo the palette length
+                                       [216, 82, 24],
+                                       [236, 176, 31],
+                                       [125, 46, 141],
+                                       [118, 171, 47],
+                                       [76, 189, 237],
+                                       [161, 19, 46],
+                                       [76, 76, 76],
+                                       [153, 153, 153],
+                                       [255, 0, 0],
+                                       [255, 127, 0],
+                                       [190, 190, 0],
+                                       [0, 255, 0],
+                                       [0, 0, 255],
+                                       [170, 0, 255],
+                                       [84, 84, 0],
+                                       [84, 170, 0],
+                                       [84, 255, 0],
+                                       [170, 84, 0],
+                                       [170, 170, 0],
+                                       [170, 255, 0],
+                                       [255, 84, 0],
+                                       [255, 170, 0],
+                                       [255, 255, 0],
+                                       [0, 84, 127],
+                                       [0, 170, 127],
+                                       [0, 255, 127],
+                                       [84, 0, 127],
+                                       [84, 84, 127],
+                                       [84, 170, 127],
+                                       [84, 255, 127],
+                                       [170, 0, 127],
+                                       [170, 84, 127],
+                                       [170, 170, 127],
+                                       [170, 255, 127],
+                                       [255, 0, 127],
+                                       [255, 84, 127],
+                                       [255, 170, 127],
+                                       [255, 255, 127],
+                                       [0, 84, 255],
+                                       [0, 170, 255],
+                                       [0, 255, 255],
+                                       [84, 0, 255],
+                                       [84, 84, 255],
+                                       [84, 170, 255],
+                                       [84, 255, 255],
+                                       [170, 0, 255],
+                                       [170, 84, 255],
+                                       [170, 170, 255],
+                                       [170, 255, 255],
+                                       [255, 0, 255],
+                                       [255, 84, 255],
+                                       [255, 170, 255],
+                                       [42, 0, 0],
+                                       [84, 0, 0],
+                                       [127, 0, 0],
+                                       [170, 0, 0],
+                                       [212, 0, 0],
+                                       [255, 0, 0],
+                                       [0, 42, 0],
+                                       [0, 84, 0],
+                                       [0, 127, 0],
+                                       [0, 170, 0],
+                                       [0, 212, 0],
+                                       [0, 255, 0],
+                                       [0, 0, 42],
+                                       [0, 0, 84],
+                                       [0, 0, 127],
+                                       [0, 0, 170],
+                                       [0, 0, 212],
+                                       [0, 0, 255],
+                                       [0, 0, 0],
+                                       [36, 36, 36],
+                                       [72, 72, 72],
+                                       [109, 109, 109],
+                                       [145, 145, 145],
+                                       [182, 182, 182],
+                                       [218, 218, 218],
+                                       [255, 255, 255]], dtype=np.uint8)
+
+    class_color_palette = np.asarray([2 ** 25 - 1, 2 ** 15 - 1, 2 ** 21 - 1])  # per-channel multipliers for class IDs
+
+    def __init__(self, class_labels, show_boxes=False,
+                 show_masks=True, show_scores=False):
+        super().__init__()
+        self.class_labels = class_labels  # stored only; no method of this class reads it
+        self.show_masks = show_masks
+        self.show_boxes = show_boxes
+        self.show_scores = show_scores
+
+    def __call__(self, image, boxes, classes, scores, segms, texts, ids=None):  # returns the annotated image
+        if self.show_masks and segms is not None:
+            image = self.overlay_masks(image, segms, ids)
+
+        if self.show_boxes:
+            image = self.overlay_boxes(image, boxes, classes)
+
+        # Text labels are always drawn; show_scores only decides whether the score is appended.
+        image = self.overlay_class_names(image, boxes, texts, scores, show_score=self.show_scores)
+
+        return image
+
+    def compute_colors_for_labels(self, labels):
+        colors = labels[:, None] * self.class_color_palette  # one row per label, one column per palette entry
+        colors = (colors % 255).astype(np.uint8)  # modulo 255 keeps every channel in 0..254
+        return colors
+
+    def overlay_boxes(self, image, boxes, classes):
+        colors = self.compute_colors_for_labels(classes).tolist()  # plain Python ints, one color per box
+        for box, color in zip(boxes, colors):
+            box = box.astype(int)
+            top_left, bottom_right = box[:2].tolist(), box[2:].tolist()  # assumes (xmin, ymin, xmax, ymax) order
+            image = cv2.rectangle(
+                image, tuple(top_left), tuple(bottom_right), tuple(color), 1
+            )
+        return image
+
+    def overlay_masks(self, image, masks, ids=None):
+        segments_image = image.copy()
+        aggregated_mask = np.zeros(image.shape[:2], dtype=np.uint8)  # union of all instance masks
+        aggregated_colored_mask = np.zeros(image.shape, dtype=np.uint8)  # instance colors painted where masks are set
+        black = np.zeros(3, dtype=np.uint8)
+
+        all_contours = []
+        for i, mask in enumerate(masks):
+            color_idx = i if ids is None else ids[i]  # with ids given, the color follows the ID, not the position
+            mask_color = self.instance_color_palette[color_idx % len(self.instance_color_palette)].tolist()
+
+            # NOTE(review): [-2] presumably selects the contour list for both the 2- and 3-value return forms.
+            contours = cv2.findContours(mask, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)[-2]
+            if contours:
+                all_contours.append(contours[0])  # only the first contour of each mask is outlined
+
+            cv2.bitwise_or(aggregated_mask, mask, dst=aggregated_mask)
+            cv2.bitwise_or(aggregated_colored_mask, np.asarray(mask_color, dtype=np.uint8),
+                           dst=aggregated_colored_mask, mask=mask)
+
+        # Fill the area occupied by all instances with a colored instances mask image.
+        cv2.bitwise_and(segments_image, black, dst=segments_image, mask=aggregated_mask)
+        cv2.bitwise_or(segments_image, aggregated_colored_mask, dst=segments_image, mask=aggregated_mask)
+        # Blend original image with the one, where instances are colored.
+        # As a result instances masks become transparent.
+        cv2.addWeighted(image, 0.5, segments_image, 0.5, 0, dst=image)  # written into `image` itself (in place)
+
+        cv2.drawContours(image, all_contours, -1, (0, 0, 0))  # black outlines; -1 draws every collected contour
+
+        return image
+
+    def overlay_class_names(self, image, boxes, texts, scores, show_score=True):
+        template = '{}: {:.2f}' if show_score else '{}'  # the one-field template simply ignores the extra score
+        white = (255, 255, 255)
+
+        for box, score, label in zip(boxes, scores, texts):
+            s = template.format(label, score)
+            textsize = cv2.getTextSize(s, cv2.FONT_HERSHEY_SIMPLEX, 0.5, 1)[0]
+            # NOTE(review): putText's org is the text's bottom-left corner, so y sits above the box center - confirm.
+            position = ((box[:2] + box[2:] - textsize) / 2).astype(int)
+            cv2.putText(image, s, tuple(position), cv2.FONT_HERSHEY_SIMPLEX, .5, white, 1)
+
+        return image
diff --git a/demos/security_barrier_camera_demo/CMakeLists.txt b/demos/security_barrier_camera_demo/CMakeLists.txt
index 4f0ade22c1b..ebfab186404 100644
--- a/demos/security_barrier_camera_demo/CMakeLists.txt
+++ b/demos/security_barrier_camera_demo/CMakeLists.txt
@@ -8,4 +8,5 @@ file (GLOB HEADERS ${CMAKE_CURRENT_SOURCE_DIR}/*.hpp)
 ie_add_sample(NAME security_barrier_camera_demo
               SOURCES ${SOURCES}
               HEADERS ${HEADERS}
+              DEPENDENCIES monitors
               OPENCV_DEPENDENCIES core highgui videoio)
diff --git a/demos/security_barrier_camera_demo/README.md b/demos/security_barrier_camera_demo/README.md
index bb2d423626e..83f3abb307b 100644
--- a/demos/security_barrier_camera_demo/README.md
+++ b/demos/security_barrier_camera_demo/README.md
@@ -1,11 +1,11 @@
-# Security Barrier Camera С++ Demo
+# Security Barrier Camera C++ Demo
 
 This demo showcases Vehicle and License Plate Detection network followed by the Vehicle Attributes Recognition and License Plate Recognition networks applied on top
 of the detection results. You can use a set of the following pre-trained models with the demo:
-* `vehicle-license-plate-detection-barrier-0106`, which is a primary detection network to find the vehicles and license plates
+* `vehicle-license-plate-detection-barrier-0106` or `vehicle-license-plate-detection-barrier-0123`, which is a primary detection network to find the vehicles and license plates
 * `vehicle-attributes-recognition-barrier-0039`, which is executed on top of the results from the first network and
 reports general vehicle attributes, for example, vehicle type (car/van/bus/track) and color
-* `license-plate-recognition-barrier-0001`, which is executed on top of the results from the first network
+* `license-plate-recognition-barrier-0001` or `license-plate-recognition-barrier-0007`, which is executed on top of the results from the first network
 and reports a string per recognized license plate
 
 For more information about the pre-trained models, refer to the [model documentation](../../models/intel/index.md).
@@ -42,10 +42,8 @@ At the end of the sequence, the `VideoFrame` is destroyed and the sequence start
 ## Running
 
 Running the application with the <code>-h</code> option yields the following usage message:
-```sh
-[ INFO ] InferenceEngine:
-    API version ............ <version>
-    Build .................. <number>
+```
+[ INFO ] InferenceEngine: <version>
 
 interactive_vehicle_detection [OPTION]
 Options:
@@ -78,7 +76,7 @@ Options:
     -tag                       Required for HDDL plugin only. If not set, the performance on Intel(R) Movidius(TM) X VPUs will not be optimal. Running each network on a set of Intel(R) Movidius(TM) X VPUs with a specific tag. You must specify the number of VPUs for each network in the hddl_service.config file. Refer to the corresponding README file for more information.
     -nstreams "<integer>"      Optional. Number of streams to use for inference on the CPU or/and GPU in throughput mode (for HETERO and MULTI device cases use format <device1>:<nstreams1>,<device2>:<nstreams2> or just <nstreams>)
     -nthreads "<integer>"      Optional. Number of threads to use for inference on the CPU (including HETERO and MULTI cases).
-
+    -u                         Optional. List of monitors to show initially.
 ```
 
 Running the application with an empty list of options yields an error message.
@@ -98,13 +96,24 @@ To do inference for two video inputs using two asynchronous infer request on FPG
 ./security_barrier_camera_demo -i <path_to_video>/inputVideo_0.mp4 <path_to_video>/inputVideo_1.mp4 -m <path_to_model>/vehicle-license-plate-detection-barrier-0106.xml -m_va <path_to_model>/vehicle-attributes-recognition-barrier-0039.xml -m_lpr <path_to_model>/license-plate-recognition-barrier-0001.xml -d HETERO:FPGA,CPU -d_va HETERO:FPGA,CPU -d_lpr HETERO:FPGA,CPU -nireq 2
 ```
 
-> **NOTE**: For the `-tag` option (HDDL plugin only), you must specify the number of VPUs for each network in the `hddl_service.config` file located in the `<INSTALL_DIR>/deployment_tools/inference_engine/external/hddl/config/` direcrtory using the following tags:
+To do inference for video inputs on Intel® Vision Accelerator Design with Intel® Movidius™ VPUs, some optimization hints are suggested to make good use of the computation ability:
+
+* configuring the number of allocated frames (`-n_iqs`) to provide enough inputs for inference;
+* configuring the number of infer requests (`-nireq`) to achieve asynchronous inference;
+* configuring the number of threads (`-n_wt`) for multi-threaded processing.
+
+For example, to run the sample on one Intel® Vision Accelerator Design with Intel® Movidius™ VPUs Compact R card, run the following command:
+```sh
+./security_barrier_camera_demo -i <path_to_video>/inputVideo.mp4 -m <path_to_model>/vehicle-license-plate-detection-barrier-0106.xml -m_va <path_to_model>/vehicle-attributes-recognition-barrier-0039.xml -m_lpr <path_to_model>/license-plate-recognition-barrier-0001.xml -d HDDL -d_va HDDL -d_lpr HDDL -n_iqs 10 -n_wt 4 -nireq 10
+```
+
+> **NOTE**: For the `-tag` option (HDDL plugin only), you must specify the number of VPUs for each network in the `hddl_service.config` file located in the `<INSTALL_DIR>/deployment_tools/inference_engine/external/hddl/config/` directory using the following tags:
 > * `tagDetect` for the Vehicle and License Plate Detection network
 > * `tagAttr` for the Vehicle Attributes Recognition network
 > * `tagLPR` for the License Plate Recognition network
 >
 > For example, to run the sample on one Intel® Vision Accelerator Design with Intel® Movidius™ VPUs Compact R card with eight Intel&reg; Movidius&trade; X VPUs:
-> ```sh
+> ```json
 > "service_settings":
 > {
 >  "graph_tag_map":{"tagDetect": 6, "tagAttr": 1, "tagLPR": 1}
@@ -114,7 +123,7 @@ To do inference for two video inputs using two asynchronous infer request on FPG
 
 ### Optimization Hints for Heterogeneous Scenarios with FPGA
 
-If you build the Inference Engine with the OMP, you can use the following parameters for Heterogeneous scenarois:
+If you build the Inference Engine with the OMP, you can use the following parameters for Heterogeneous scenarios:
 
 * `OMP_NUM_THREADS`: Specifies number of threads to use. For heterogeneous scenarios with FPGA, when several inference requests are used asynchronously, limiting the number of CPU threads with `OMP_NUM_THREADS` allows to avoid competing for resources between threads. For the Security Barrier Camera Demo, recommended value is `OMP_NUM_THREADS=1`.
 * `KMP_BLOCKTIME`: Sets the time, in milliseconds, that a thread should wait, after completing the execution of a parallel region, before sleeping. The default value is 200ms, which is not optimal for the demo. Recommended value is `KMP_BLOCKTIME=1`.
@@ -123,7 +132,7 @@ If you build the Inference Engine with the OMP, you can use the following parame
 
 The demo uses OpenCV to display the resulting frame with detections rendered as bounding boxes and text.
 
-> **NOTE**: On VPU devices (Intel® Movidius™ Neural Compute Stick, Intel® Neural Compute Stick 2, and Intel® Vision Accelerator Design with Intel® Movidius™ VPUs) this demo has been tested on the following Model Downloader available topologies: 
+> **NOTE**: On VPU devices (Intel® Movidius™ Neural Compute Stick, Intel® Neural Compute Stick 2, and Intel® Vision Accelerator Design with Intel® Movidius™ VPUs) this demo has been tested on the following Model Downloader available topologies:
 >* `license-plate-recognition-barrier-0001`
 >* `vehicle-attributes-recognition-barrier-0039`
 >* `vehicle-license-plate-detection-barrier-0106`
diff --git a/demos/security_barrier_camera_demo/common.hpp b/demos/security_barrier_camera_demo/common.hpp
index 6bc524ae220..3db9d994fda 100644
--- a/demos/security_barrier_camera_demo/common.hpp
+++ b/demos/security_barrier_camera_demo/common.hpp
@@ -56,13 +56,13 @@ struct HigherPriority {
 class Worker {
 public:
     explicit Worker(unsigned threadNum):
-        threadPull(threadNum), running{false} {}
+        threadPool(threadNum), running{false} {}
     ~Worker() {
         stop();
     }
     void runThreads() {
         running = true;
-        for (std::thread& t : threadPull) {
+        for (std::thread& t : threadPool) {
             t = std::thread(&Worker::threadFunc, this);
         }
     }
@@ -100,7 +100,7 @@ class Worker {
         tasksCondVar.notify_all();
     }
     void join() {
-        for (auto& t : threadPull) {
+        for (auto& t : threadPool) {
             t.join();
         }
         if (nullptr != currentException) {
@@ -112,7 +112,7 @@ class Worker {
     std::condition_variable tasksCondVar;
     std::set<std::shared_ptr<Task>, HigherPriority> tasks;
     std::mutex tasksMutex;
-    std::vector<std::thread> threadPull;
+    std::vector<std::thread> threadPool;
     std::atomic<bool> running;
     std::exception_ptr currentException;
     std::mutex excpetionMutex;
diff --git a/demos/security_barrier_camera_demo/main.cpp b/demos/security_barrier_camera_demo/main.cpp
index 3eb25aea05e..e178c381586 100644
--- a/demos/security_barrier_camera_demo/main.cpp
+++ b/demos/security_barrier_camera_demo/main.cpp
@@ -16,9 +16,7 @@
 #include <cldnn/cldnn_config.hpp>
 #include <inference_engine.hpp>
 #include <vpu/vpu_plugin_config.hpp>
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
+#include <monitors/presenter.h>
 #include <samples/ocv_common.hpp>
 #include <samples/args_helper.hpp>
 
@@ -59,7 +57,7 @@ bool ParseAndCheckCommandLine(int argc, char *argv[]) {
 struct BboxAndDescr {
     enum class ObjectType {
         NONE,
-        VEHICCLE,
+        VEHICLE,
         PLATE,
     } objectType;
     cv::Rect rect;
@@ -67,22 +65,19 @@ struct BboxAndDescr {
 };
 
 struct InferRequestsContainer {
-    explicit InferRequestsContainer(std::vector<InferRequest> inferRequests):
-        actualInferRequests{inferRequests} {
-        for (auto& ir : actualInferRequests) {
-            inferRequests.push_back(ir);
-        }
-    }
     InferRequestsContainer() = default;
-    InferRequestsContainer& operator=(const InferRequestsContainer& other) {  // copy assignment
-        if (this != &other) {  // self-assignment check expected
-            this->actualInferRequests = other.actualInferRequests;
-            for (auto& ir : this->actualInferRequests) {
-                this->inferRequests.container.push_back(ir);
-            }
+    InferRequestsContainer(const InferRequestsContainer&) = delete;
+    InferRequestsContainer& operator=(const InferRequestsContainer&) = delete;
+
+    void assign(const std::vector<InferRequest>& inferRequests) {
+        actualInferRequests = inferRequests;
+        this->inferRequests.container.clear();
+
+        for (auto& ir : this->actualInferRequests) {
+            this->inferRequests.container.push_back(ir);
         }
-        return *this;
     }
+
     std::vector<InferRequest> getActualInferRequests() {
         return actualInferRequests;
     }
@@ -97,7 +92,7 @@ struct Context {  // stores all global data for tasks
             const Detector& detector, const std::weak_ptr<Worker>& inferTasksWorker,
             const VehicleAttributesClassifier& vehicleAttributesClassifier, const Lpr& lpr, const std::weak_ptr<Worker>& detectionsProcessorsWorker,
             int pause, const std::vector<cv::Size>& gridParam, cv::Size displayResolution, std::chrono::steady_clock::duration showPeriod,
-                const std::weak_ptr<Worker>& drawersWorker,
+                const std::weak_ptr<Worker>& drawersWorker, const std::string& monitorsStr,
             uint64_t lastFrameId,
             const std::weak_ptr<Worker> resAggregatorsWorker,
             uint64_t nireq,
@@ -106,7 +101,7 @@ struct Context {  // stores all global data for tasks
         readersContext{inputChannels, readersWorker, std::vector<int64_t>(inputChannels.size(), -1), std::vector<std::mutex>(inputChannels.size())},
         inferTasksContext{detector, inferTasksWorker},
         detectionsProcessorsContext{vehicleAttributesClassifier, lpr, detectionsProcessorsWorker},
-        drawersContext{pause, gridParam, displayResolution, showPeriod, drawersWorker},
+        drawersContext{pause, gridParam, displayResolution, showPeriod, drawersWorker, monitorsStr},
         videoFramesContext{std::vector<uint64_t>(inputChannels.size(), lastFrameId), std::vector<std::mutex>(inputChannels.size())},
         resAggregatorsWorker{resAggregatorsWorker},
         nireq{nireq},
@@ -128,9 +123,9 @@ struct Context {  // stores all global data for tasks
             return detectionsProcessorsContext.vehicleAttributesClassifier.createInferRequest();});
         std::generate_n(std::back_inserter(lprInferRequests), nrecognizersireq, [&]{
             return detectionsProcessorsContext.lpr.createInferRequest();});
-        detectorsInfers = InferRequestsContainer(detectorInferRequests);
-        attributesInfers = InferRequestsContainer(attributesInferRequests);
-        platesInfers = InferRequestsContainer(lprInferRequests);
+        detectorsInfers.assign(detectorInferRequests);
+        attributesInfers.assign(attributesInferRequests);
+        platesInfers.assign(lprInferRequests);
     }
     struct {
         std::vector<std::shared_ptr<InputChannel>> inputChannels;
@@ -149,9 +144,12 @@ struct Context {  // stores all global data for tasks
     } detectionsProcessorsContext;
     struct DrawersContext {
         DrawersContext(int pause, const std::vector<cv::Size>& gridParam, cv::Size displayResolution, std::chrono::steady_clock::duration showPeriod,
-                       const std::weak_ptr<Worker>& drawersWorker):
+                       const std::weak_ptr<Worker>& drawersWorker, const std::string& monitorsStr):
             pause{pause}, gridParam{gridParam}, displayResolution{displayResolution}, showPeriod{showPeriod}, drawersWorker{drawersWorker},
-            lastShownframeId{0}, prevShow{std::chrono::steady_clock::time_point()}, framesAfterUpdate{0}, updateTime{std::chrono::steady_clock::time_point()} {}
+            lastShownframeId{0}, prevShow{std::chrono::steady_clock::time_point()}, framesAfterUpdate{0}, updateTime{std::chrono::steady_clock::time_point()},
+            presenter{monitorsStr,
+                GridMat(gridParam, displayResolution).outimg.rows - 70,
+                cv::Size{GridMat(gridParam, displayResolution).outimg.cols / 4, 60}} {}
         int pause;
         std::vector<cv::Size> gridParam;
         cv::Size displayResolution;
@@ -164,6 +162,7 @@ struct Context {  // stores all global data for tasks
         std::ostringstream outThroughput;
         unsigned framesAfterUpdate;
         std::chrono::steady_clock::time_point updateTime;
+        Presenter presenter;
     } drawersContext;
     struct {
         std::vector<uint64_t> lastframeIds;
@@ -360,6 +359,8 @@ void Drawer::process() {
         }
         cv::putText(mat, context.drawersContext.outThroughput.str(), cv::Point2f(15, 35), cv::FONT_HERSHEY_TRIPLEX, 0.7, cv::Scalar{255, 255, 255});
 
+        context.drawersContext.presenter.drawGraphs(mat);
+
         cv::imshow("Detection results", firstGridIt->second.getMat());
         context.drawersContext.prevShow = std::chrono::steady_clock::now();
         const int key = cv::waitKey(context.drawersContext.pause);
@@ -369,6 +370,8 @@ void Drawer::process() {
             } catch (const std::bad_weak_ptr&) {}
         } else if (key == 32) {
             context.drawersContext.pause = (context.drawersContext.pause + 1) & 1;
+        } else {
+            context.drawersContext.presenter.handleKey(key);
         }
         firstGridIt->second.clear();
         gridMats.emplace((--gridMats.end())->first + 1, firstGridIt->second);
@@ -386,7 +389,7 @@ void ResAggregator::process() {
             switch (bboxAndDescr.objectType) {
                 case BboxAndDescr::ObjectType::NONE: cv::rectangle(sharedVideoFrame->frame, bboxAndDescr.rect, {255, 255, 0},  4);
                                                      break;
-                case BboxAndDescr::ObjectType::VEHICCLE: cv::rectangle(sharedVideoFrame->frame, bboxAndDescr.rect, {0, 255, 0},  4);
+                case BboxAndDescr::ObjectType::VEHICLE: cv::rectangle(sharedVideoFrame->frame, bboxAndDescr.rect, {0, 255, 0},  4);
                                                          cv::putText(sharedVideoFrame->frame, bboxAndDescr.descr,
                                                                      cv::Point{bboxAndDescr.rect.x, bboxAndDescr.rect.y + 35},
                                                                      cv::FONT_HERSHEY_COMPLEX, 1.3, cv::Scalar(0, 255, 0), 4);
@@ -497,7 +500,7 @@ void DetectionsProcessor::process() {
                                 classifiersAggreagator->rawAttributes.lockedPush_back("Vehicle Attributes results:" + attributes.first + ';'
                                                                                       + attributes.second + '\n');
                             }
-                            classifiersAggreagator->push(BboxAndDescr{BboxAndDescr::ObjectType::VEHICCLE, rect, attributes.first + ' ' + attributes.second});
+                            classifiersAggreagator->push(BboxAndDescr{BboxAndDescr::ObjectType::VEHICLE, rect, attributes.first + ' ' + attributes.second});
                             context.attributesInfers.inferRequests.lockedPush_back(attributesRequest);
                         }, classifiersAggreagator,
                            std::ref(attributesRequest),
@@ -711,11 +714,6 @@ int main(int argc, char* argv[]) {
             std::cout << ie.GetVersions(device) << std::endl;
 
             if ("CPU" == device) {
-#ifdef WITH_EXTENSIONS
-                /** Load default extensions lib for the CPU device (e.g. SSD's DetectionOutput)**/
-                ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-#endif
-
                 if (!FLAGS_l.empty()) {
                     // CPU(MKLDNN) extensions are loaded as a shared library and passed as a pointer to base extension
                     auto extension_ptr = make_so_pointer<IExtension>(FLAGS_l);
@@ -816,7 +814,7 @@ int main(int argc, char* argv[]) {
         Context context{inputChannels, worker,
                         detector, worker,
                         vehicleAttributesClassifier, lpr, worker,
-                        pause, gridParam, displayResolution, showPeriod, worker,
+                        pause, gridParam, displayResolution, showPeriod, worker, FLAGS_u,
                         FLAGS_n_iqs - 1,
                         worker,
                         nireq,
@@ -869,6 +867,8 @@ int main(int argc, char* argv[]) {
                 / (frameCounter * context.nireq) * 100;
             std::cout << "Detection InferRequests usage: " << detectionsInfersUsage << "%\n";
         }
+
+        std::cout << context.drawersContext.presenter.reportMeans() << '\n';
     } catch (const std::exception& error) {
         std::cerr << "[ ERROR ] " << error.what() << std::endl;
         return 1;
diff --git a/demos/security_barrier_camera_demo/net_wrappers.hpp b/demos/security_barrier_camera_demo/net_wrappers.hpp
index cc9d9ddaf35..0ce43fb5e56 100644
--- a/demos/security_barrier_camera_demo/net_wrappers.hpp
+++ b/demos/security_barrier_camera_demo/net_wrappers.hpp
@@ -26,14 +26,11 @@ class Detector {
     static constexpr int objectSize = 7;  // Output should have 7 as a last dimension"
 
     Detector() = default;
-    Detector(InferenceEngine::Core& ie, const std::string deviceName, const std::string& xmlPath, const std::vector<float>& detectionTresholds,
+    Detector(InferenceEngine::Core& ie, const std::string& deviceName, const std::string& xmlPath, const std::vector<float>& detectionTresholds,
             const bool autoResize, const std::map<std::string, std::string> & pluginConfig) :
         detectionTresholds{detectionTresholds}, ie_{ie} {
-        InferenceEngine::CNNNetReader netReader;
-        netReader.ReadNetwork(xmlPath);
-        std::string detectorBinFileName = fileNameNoExt(xmlPath) + ".bin";
-        netReader.ReadWeights(detectorBinFileName);
-        InferenceEngine::InputsDataMap inputInfo(netReader.getNetwork().getInputsInfo());
+        auto network = ie.ReadNetwork(xmlPath);
+        InferenceEngine::InputsDataMap inputInfo(network.getInputsInfo());
         if (inputInfo.size() != 1) {
             throw std::logic_error("Detector should have only one input");
         }
@@ -49,7 +46,7 @@ class Detector {
         detectorInputBlobName = inputInfo.begin()->first;
 
         // ---------------------------Check outputs ------------------------------------------------------
-        InferenceEngine::OutputsDataMap outputInfo(netReader.getNetwork().getOutputsInfo());
+        InferenceEngine::OutputsDataMap outputInfo(network.getOutputsInfo());
         if (outputInfo.size() != 1) {
             throw std::logic_error("Vehicle Detection network should have only one output");
         }
@@ -67,7 +64,7 @@ class Detector {
         }
         _output->setPrecision(InferenceEngine::Precision::FP32);
 
-        net = ie_.LoadNetwork(netReader.getNetwork(), deviceName, pluginConfig);
+        net = ie_.LoadNetwork(network, deviceName, pluginConfig);
     }
 
     InferenceEngine::InferRequest createInferRequest() {
@@ -133,11 +130,8 @@ class VehicleAttributesClassifier {
     VehicleAttributesClassifier() = default;
     VehicleAttributesClassifier(InferenceEngine::Core& ie, const std::string & deviceName,
         const std::string& xmlPath, const bool autoResize, const std::map<std::string, std::string> & pluginConfig) : ie_(ie) {
-        InferenceEngine::CNNNetReader attributesNetReader;
-        attributesNetReader.ReadNetwork(FLAGS_m_va);
-        std::string attributesBinFileName = fileNameNoExt(FLAGS_m_va) + ".bin";
-        attributesNetReader.ReadWeights(attributesBinFileName);
-        InferenceEngine::InputsDataMap attributesInputInfo(attributesNetReader.getNetwork().getInputsInfo());
+        auto network = ie.ReadNetwork(FLAGS_m_va);
+        InferenceEngine::InputsDataMap attributesInputInfo(network.getInputsInfo());
         if (attributesInputInfo.size() != 1) {
             throw std::logic_error("Vehicle Attribs topology should have only one input");
         }
@@ -152,7 +146,7 @@ class VehicleAttributesClassifier {
 
         attributesInputName = attributesInputInfo.begin()->first;
 
-        InferenceEngine::OutputsDataMap attributesOutputInfo(attributesNetReader.getNetwork().getOutputsInfo());
+        InferenceEngine::OutputsDataMap attributesOutputInfo(network.getOutputsInfo());
         if (attributesOutputInfo.size() != 2) {
             throw std::logic_error("Vehicle Attribs Network expects networks having two outputs");
         }
@@ -162,7 +156,7 @@ class VehicleAttributesClassifier {
         it->second->setPrecision(InferenceEngine::Precision::FP32);
         outputNameForType = (it)->second->getName();  // type is the second output.
 
-        net = ie_.LoadNetwork(attributesNetReader.getNetwork(), deviceName, pluginConfig);
+        net = ie_.LoadNetwork(network, deviceName, pluginConfig);
     }
 
     InferenceEngine::InferRequest createInferRequest() {
@@ -214,16 +208,13 @@ class Lpr {
     Lpr(InferenceEngine::Core& ie, const std::string & deviceName, const std::string& xmlPath, const bool autoResize,
         const std::map<std::string, std::string> &pluginConfig) :
         ie_{ie} {
-        InferenceEngine::CNNNetReader LprNetReader;
-        LprNetReader.ReadNetwork(FLAGS_m_lpr);
-        std::string lprBinFileName = fileNameNoExt(FLAGS_m_lpr) + ".bin";
-        LprNetReader.ReadWeights(lprBinFileName);
+        auto network = ie.ReadNetwork(FLAGS_m_lpr);
 
         /** LPR network should have 2 inputs (and second is just a stub) and one output **/
         // ---------------------------Check inputs ------------------------------------------------------
-        InferenceEngine::InputsDataMap LprInputInfo(LprNetReader.getNetwork().getInputsInfo());
-        if (LprInputInfo.size() != 2) {
-            throw std::logic_error("LPR should have 2 inputs");
+        InferenceEngine::InputsDataMap LprInputInfo(network.getInputsInfo());
+        if (LprInputInfo.size() != 1 && LprInputInfo.size() != 2) {
+            throw std::logic_error("LPR should have 1 or 2 inputs");
         }
         InferenceEngine::InputInfo::Ptr& LprInputInfoFirst = LprInputInfo.begin()->second;
         LprInputInfoFirst->setPrecision(InferenceEngine::Precision::U8);
@@ -234,19 +225,29 @@ class Lpr {
             LprInputInfoFirst->setLayout(InferenceEngine::Layout::NCHW);
         }
         LprInputName = LprInputInfo.begin()->first;
-        auto sequenceInput = (++LprInputInfo.begin());
-        LprInputSeqName = sequenceInput->first;
-        maxSequenceSizePerPlate = sequenceInput->second->getTensorDesc().getDims()[0];
+        if (LprInputInfo.size() == 2){
+            // An LPR model converted from Caffe has a second input that is only a stub
+            auto sequenceInput = (++LprInputInfo.begin());
+            LprInputSeqName = sequenceInput->first;
+        } else {
+            LprInputSeqName = "";
+        }
+
         // -----------------------------------------------------------------------------------------------------
 
         // ---------------------------Check outputs ------------------------------------------------------
-        InferenceEngine::OutputsDataMap LprOutputInfo(LprNetReader.getNetwork().getOutputsInfo());
+        InferenceEngine::OutputsDataMap LprOutputInfo(network.getOutputsInfo());
         if (LprOutputInfo.size() != 1) {
             throw std::logic_error("LPR should have 1 output");
         }
         LprOutputName = LprOutputInfo.begin()->first;
+        auto lprOutputInfo = (LprOutputInfo.begin());
 
-        net = ie_.LoadNetwork(LprNetReader.getNetwork(), deviceName, pluginConfig);
+        // The output tensor shape is [1,88,1,1] for a model converted from Caffe and [1,1,88,1] for a model converted from TF
+        size_t indexOfSequenceSize = LprInputSeqName == "" ? 2 : 1;
+        maxSequenceSizePerPlate = lprOutputInfo->second->getTensorDesc().getDims()[indexOfSequenceSize];
+
+        net = ie_.LoadNetwork(network, deviceName, pluginConfig);
     }
 
     InferenceEngine::InferRequest createInferRequest() {
@@ -265,16 +266,19 @@ class Lpr {
             const cv::Mat& vehicleImage = img(plateRect);
             matU8ToBlob<uint8_t>(vehicleImage, roiBlob);
         }
-        InferenceEngine::Blob::Ptr seqBlob = inferRequest.GetBlob(LprInputSeqName);
-        // second input is sequence, which is some relic from the training
-        // it should have the leading 0.0f and rest 1.0f
-        float* blob_data = seqBlob->buffer().as<float*>();
-        blob_data[0] = 0.0f;
-        std::fill(blob_data + 1, blob_data + maxSequenceSizePerPlate, 1.0f);
+
+        if (LprInputSeqName != "") {
+            InferenceEngine::Blob::Ptr seqBlob = inferRequest.GetBlob(LprInputSeqName);
+            // second input is sequence, which is some relic from the training
+            // it should have the leading 0.0f and rest 1.0f
+            float* blob_data = seqBlob->buffer().as<float*>();
+            blob_data[0] = 0.0f;
+            std::fill(blob_data + 1, blob_data + seqBlob->getTensorDesc().getDims()[0], 1.0f);
+        }
     }
 
     std::string getResults(InferenceEngine::InferRequest& inferRequest) {
-        static const std::vector<std::string> items = {
+        static const char *const items[] = {
                 "0", "1", "2", "3", "4", "5", "6", "7", "8", "9",
                 "<Anhui>", "<Beijing>", "<Chongqing>", "<Fujian>",
                 "<Gansu>", "<Guangdong>", "<Guangxi>", "<Guizhou>",
@@ -297,7 +301,7 @@ class Lpr {
             if (data[i] == -1) {
                 break;
             }
-            result += items[static_cast<std::vector<std::string>::size_type>(data[i])];
+            result += items[std::size_t(data[i])];
         }
         return result;
     }
diff --git a/demos/security_barrier_camera_demo/security_barrier_camera_demo.hpp b/demos/security_barrier_camera_demo/security_barrier_camera_demo.hpp
index af0cd566291..8bafd7afda4 100644
--- a/demos/security_barrier_camera_demo/security_barrier_camera_demo.hpp
+++ b/demos/security_barrier_camera_demo/security_barrier_camera_demo.hpp
@@ -9,202 +9,82 @@
 #include <gflags/gflags.h>
 #include <iostream>
 
-/// @brief message for help argument
 static const char help_message[] = "Print a usage message.";
-
-/// @brief message for enabling input video
 static const char video_message[] = "Required for video or image files input. Path to video or image files.";
-
-/// @brief message for model argument
 static const char detection_model_message[] = "Required. Path to the Vehicle and License Plate Detection model .xml file.";
 static const char vehicle_attribs_model_message[] = "Optional. Path to the Vehicle Attributes model .xml file.";
 static const char lpr_model_message[] = "Optional. Path to the License Plate Recognition model .xml file.";
-
-/// @brief message for assigning vehicle detection inference to device
-static const char target_device_message[] = "Optional. Specify the target device for Vehicle Detection "\
-                                            "(the list of available devices is shown below). Default value is CPU. " \
-                                            "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
+static const char target_device_message[] = "Optional. Specify the target device for Vehicle Detection "
+                                            "(the list of available devices is shown below). Default value is CPU. "
+                                            "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
                                             "The application looks for a suitable plugin for the specified device.";
-
-/// @brief message for assigning vehicle attributes to device
-static const char target_device_message_vehicle_attribs[] = "Optional. Specify the target device for Vehicle Attributes "\
-                                                            "(the list of available devices is shown below). Default value is CPU. " \
-                                                            "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
+static const char target_device_message_vehicle_attribs[] = "Optional. Specify the target device for Vehicle Attributes "
+                                                            "(the list of available devices is shown below). Default value is CPU. "
+                                                            "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
                                                             "The application looks for a suitable plugin for the specified device.";
-
-/// @brief message for assigning LPR inference to device
-static const char target_device_message_lpr[] = "Optional. Specify the target device for License Plate Recognition "\
-                                                "(the list of available devices is shown below). Default value is CPU. " \
-                                                "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
+static const char target_device_message_lpr[] = "Optional. Specify the target device for License Plate Recognition "
+                                                "(the list of available devices is shown below). Default value is CPU. "
+                                                "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
                                                 "The application looks for a suitable plugin for the specified device.";
-
-/// @brief message for performance counters
 static const char performance_counter_message[] = "Optional. Enables per-layer performance statistics.";
-
-/// @brief message raw output flag
 static const char raw_output_message[] = "Optional. Output inference results as raw values.";
-
-/// @brief message for probability threshold argument
 static const char thresh_output_message[] = "Optional. Probability threshold for vehicle and license plate detections.";
-
-/// @brief message for clDNN custom kernels desc
-static const char custom_cldnn_message[] = "Required for GPU custom kernels. "\
-"Absolute path to an .xml file with the kernels description.";
-
-/// @brief message for user library argument
-static const char custom_cpu_library_message[] = "Required for CPU custom layers. " \
-"Absolute path to a shared library with the kernels implementation.";
-
-/// @brief message no show processed video
+static const char custom_cldnn_message[] = "Required for GPU custom kernels. "
+                                           "Absolute path to an .xml file with the kernels description.";
+static const char custom_cpu_library_message[] = "Required for CPU custom layers. "
+                                                 "Absolute path to a shared library with the kernels implementation.";
 static const char no_show_processed_video[] = "Optional. Do not show processed video.";
-
-/// @brief message resizable input flag
 static const char input_resizable_message[] = "Optional. Enable resizable input with support of ROI crop and auto resize.";
-
-/// @brief message for number of infer requests
 static const char ninfer_request_message[] = "Optional. Number of infer requests. 0 sets the number of infer requests equal to the number of inputs.";
-
-/// @brief message for number of camera inputs
 static const char num_cameras[] = "Required for web camera input. Maximum number of processed camera inputs (web cameras).";
-
-/// @brief message for FPGA device IDs
 static const char fpga_device_ids_message[] = "Optional. Specify FPGA device IDs (0,1,n).";
-
-/// @brief Message for looping video argument
 static const char loop_video_output_message[] = "Optional. Enable playing video on a loop.";
-
-/// @brief message for inputs queue size
 static const char input_queue_size[] = "Optional. Number of allocated frames. It is a multiplier of the number of inputs.";
-
-/// @brief message for enabling channel duplication
-static const char ninputs_message[] = "Optional. Specify the number of channels generated from provided inputs (with -i and -nc keys). "\
-"For example, if only one camera is provided, but -ni is set to 2, the demo will process frames as if they are captured from two cameras. "\
-"0 sets the number of input channels equal to the number of provided inputs.";
-
-/// @brief message for setting playing fps
+static const char ninputs_message[] = "Optional. Specify the number of channels generated from provided inputs (with -i and -nc keys). "
+                                      "For example, if only one camera is provided, but -ni is set to 2, the demo will process frames as if they are captured from two cameras. "
+                                      "0 sets the number of input channels equal to the number of provided inputs.";
 static const char fps[] = "Optional. Set the playback speed not faster than the specified FPS. 0 removes the upper bound.";
-
-/// @brief message for setting the number of threads in Worker
 static const char worker_threads[] = "Optional. Set the number of threads including the main thread a Worker class will use.";
-
-/// @brief Message for display resolution argument
 static const char display_resolution_message[] = "Optional. Specify the maximum output window resolution.";
-
-/// @brief Message for using tag scheduler
 static const char use_tag_scheduler_message[] = "Required for HDDL plugin only. "
                                                 "If not set, the performance on Intel(R) Movidius(TM) X VPUs will not be optimal. "
                                                 "Running each network on a set of Intel(R) Movidius(TM) X VPUs with a specific tag. "
                                                 "You must specify the number of VPUs for each network in the hddl_service.config file. "
                                                 "Refer to the corresponding README file for more information.";
-
-/// @brief message for #threads for CPU inference
 static const char infer_num_threads_message[] = "Optional. Number of threads to use for inference on the CPU "
                                                 "(including HETERO and MULTI cases).";
-
-/// @brief message for #streams for CPU inference
 static const char infer_num_streams_message[] = "Optional. Number of streams to use for inference on the CPU or/and GPU in throughput mode "
                                                 "(for HETERO and MULTI device cases use format <device1>:<nstreams1>,<device2>:<nstreams2> or just <nstreams>)";
+static const char utilization_monitors_message[] = "Optional. List of monitors to show initially.";
 
-/// \brief Define flag for showing help message <br>
 DEFINE_bool(h, false, help_message);
-
-/// \brief Define parameter for input video files <br>
-/// It is a optional parameter
 DEFINE_string(i, "", video_message);
-
-/// \brief Define parameter for vehicle detection  model file <br>
-/// It is a required parameter
 DEFINE_string(m, "", detection_model_message);
-
-/// \brief Define parameter for vehicle attributes model file <br>
-/// It is a required parameter
 DEFINE_string(m_va, "", vehicle_attribs_model_message);
-
-/// \brief Define parameter for vehicle detection  model file <br>
-/// It is a required parameter
 DEFINE_string(m_lpr, "", lpr_model_message);
-
-/// \brief device the target device for vehicle detection infer on <br>
 DEFINE_string(d, "CPU", target_device_message);
-
-/// \brief device the target device for age gender detection on <br>
 DEFINE_string(d_va, "CPU", target_device_message_vehicle_attribs);
-
-/// \brief device the target device for head pose detection on <br>
 DEFINE_string(d_lpr, "CPU", target_device_message_lpr);
-
-/// \brief enable per-layer performance report <br>
 DEFINE_bool(pc, false, performance_counter_message);
-
-/// \brief Flag to output raw scoring results<br>
-/// It is an optional parameter
 DEFINE_bool(r, false, raw_output_message);
-
-/// \brief Flag to output raw scoring results<br>
-/// It is an optional parameter
 DEFINE_double(t, 0.5, thresh_output_message);
-
-/// @brief clDNN custom kernels path <br>
-/// Default is ./lib
 DEFINE_string(c, "", custom_cldnn_message);
-
-/// @brief Absolute path to CPU library with user layers <br>
-/// It is a optional parameter
 DEFINE_string(l, "", custom_cpu_library_message);
-
-/// \brief Flag to disable processed video showing<br>
-/// It is an optional parameter
 DEFINE_bool(no_show, false, no_show_processed_video);
-
-/// \brief Enables resizable input<br>
-/// It is an optional parameter
 DEFINE_bool(auto_resize, false, input_resizable_message);
-
-/// \brief Flag to specify number of infer requests<br>
-/// It is an optional parameter
 DEFINE_uint32(nireq, 0, ninfer_request_message);
-
-/// \brief Flag to specify number of expected input channels<br>
-/// It is an optional parameter
 DEFINE_uint32(nc, 0, num_cameras);
-
-/// \brief Flag to specify FPGA device IDs
-/// It is an optional parameter
 DEFINE_string(fpga_device_ids, "", fpga_device_ids_message);
-
-/// \brief Define a flag to loop video<br>
-/// It is an optional parameter
 DEFINE_bool(loop_video, false, loop_video_output_message);
-
-/// \brief Flag to specify number of allocated frames. It is a multiplyir of inputs number.<br>
-/// It is an optional parameter
 DEFINE_uint32(n_iqs, 3, input_queue_size);
-
-/// \brief Flag to specify number of input channels. It will multiply channels by reusing provided ones if there is lack of inputs<br>
-/// It is an optional parameter
 DEFINE_uint32(ni, 0, ninputs_message);
-
-/// \brief Define parameter for playing FPS <br>
-/// It is a optional parameter
 DEFINE_uint32(fps, 0, fps);
-
-/// \brief Define parameter for the number of threads including the main theread a Worker will use<br>
-/// It is a optional parameter
 DEFINE_uint32(n_wt, 1, worker_threads);
-
-/// \brief Flag to specify the maximum output window resolution<br>
-/// It is an optional parameter
 DEFINE_string(display_resolution, "1920x1080", display_resolution_message);
-
-/// \brief Message for using tag scheduler<br>
-/// It is a optional parameter
 DEFINE_bool(tag, false, use_tag_scheduler_message);
-
-/// @brief Number of threads to use for inference on the CPU in throughput mode (also affects Hetero cases)
 DEFINE_uint32(nthreads, 0, infer_num_threads_message);
-
-/// @brief Number of streams to use for inference on the CPU (also affects Hetero cases)
 DEFINE_string(nstreams, "", infer_num_streams_message);
+DEFINE_string(u, "", utilization_monitors_message);
 
 /**
 * \brief This function show a help message
@@ -242,4 +122,5 @@ void showUsage() {
     std::cout << "    -tag                       " << use_tag_scheduler_message << std::endl;
     std::cout << "    -nstreams \"<integer>\"      " << infer_num_streams_message << std::endl;
     std::cout << "    -nthreads \"<integer>\"      " << infer_num_threads_message << std::endl;
+    std::cout << "    -u                         " << utilization_monitors_message << std::endl;
 }
diff --git a/demos/segmentation_demo/CMakeLists.txt b/demos/segmentation_demo/CMakeLists.txt
index 1ff3f6fe5c3..96593288855 100644
--- a/demos/segmentation_demo/CMakeLists.txt
+++ b/demos/segmentation_demo/CMakeLists.txt
@@ -5,4 +5,5 @@
 ie_add_sample(NAME segmentation_demo
               SOURCES "${CMAKE_CURRENT_SOURCE_DIR}/main.cpp"
               HEADERS "${CMAKE_CURRENT_SOURCE_DIR}/segmentation_demo.h"
-              DEPENDENCIES format_reader)
+              DEPENDENCIES monitors
+              OPENCV_DEPENDENCIES highgui videoio imgproc core)
diff --git a/demos/segmentation_demo/README.md b/demos/segmentation_demo/README.md
index 5b9eed95fe9..504a049ec12 100644
--- a/demos/segmentation_demo/README.md
+++ b/demos/segmentation_demo/README.md
@@ -1,52 +1,52 @@
 # Image Segmentation C++ Demo
 
-This topic demonstrates how to run the Image Segmentation demo application, which does inference using image
-segmentation networks like FCN8.
+This topic demonstrates how to run the Image Segmentation demo application, which does inference using semantic segmentation networks.
 
 > **NOTE:** This topic describes usage of C++ implementation of the Image Segmentation Demo. For the Python* implementation, refer to [Image Segmentation Python* Demo](../python_demos/segmentation_demo/README.md).
 
 ## How It Works
 
-Upon the start-up the demo application reads command line parameters and loads a network and an image to the
-Inference Engine plugin. When inference is done, the application creates an output image.
+Upon start-up, the demo application reads command line parameters and loads a network. The demo runs inference and shows results for each image captured from an input. The demo's pipeline is latency-oriented: it minimizes the time required to process each single image.
 
 > **NOTE**: By default, Open Model Zoo demos expect input with BGR channels order. If you trained your model to work with RGB order, you need to manually rearrange the default channels order in the demo application or reconvert your model using the Model Optimizer tool with `--reverse_input_channels` argument specified. For more information about the argument, refer to **When to Reverse Input Channels** section of [Converting a Model Using General Conversion Parameters](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_prepare_model_convert_model_Converting_Model_General.html).
 
 ## Running
 
 Running the application with the `-h` option yields the following usage message:
-```sh
+```
 ./segmentation_demo -h
-InferenceEngine:
-    API version ............ <version>
-    Build .................. <number>
+[ INFO ] InferenceEngine: <version>
+[ INFO ] Parsing input parameters
 
 segmentation_demo [OPTION]
 Options:
 
     -h                        Print a usage message.
-    -i "<path>"               Required. Path to an .bmp image.
+    -i "<path>"               Required. Input to process.
     -m "<path>"               Required. Path to an .xml file with a trained model.
-      -l "<absolute_path>"    Required for CPU custom layers. Absolute path to a shared library with the kernel implementations.
+      -l "<absolute_path>"    Required for CPU custom layers. Absolute path to a shared library with the kernels implementations.
           Or
-      -c "<absolute_path>"    Required for GPU custom kernels. Absolute path to the xml file with the kernel descriptions.
+      -c "<absolute_path>"    Required for GPU custom kernels. Absolute path to the .xml file with the kernels descriptions.
     -d "<device>"             Optional. Specify the target device to infer on (the list of available devices is shown below). Default value is CPU. Use "-d HETERO:<comma-separated_devices_list>" format to specify HETERO plugin. The demo will look for a suitable plugin for a specified device.
+    -delay                    Optional. Default is 1. Interval in milliseconds of waiting for a key to be pressed. For a negative value the demo loads a model, opens an input and exits.
+    -no_show                  Optional. Do not visualize inference results.
+    -u                        Optional. List of monitors to show initially.
 ```
 
-Running the application with the empty list of options yields the usage message given above and an error message.
+Running the application with an empty list of options yields an error message.
 
-To run the demo, you can use public or pre-trained models. To download the pre-trained models, use the OpenVINO [Model Downloader](../../tools/downloader/README.md) or go to [https://download.01.org/opencv/](https://download.01.org/opencv/).
+To run the demo, you can use public or pre-trained models. To download the pre-trained models, use the OpenVINO [Model Downloader](../../tools/downloader/README.md) or go to [https://download.01.org/opencv/](https://download.01.org/opencv/). The list of models supported by the demo is in [models.lst](./models.lst).
 
 > **NOTE**: Before running the demo with a trained model, make sure the model is converted to the Inference Engine format (\*.xml + \*.bin) using the [Model Optimizer tool](https://docs.openvinotoolkit.org/latest/_docs_MO_DG_Deep_Learning_Model_Optimizer_DevGuide.html).
 
-You can use the following command to do inference on CPU on an image using a trained FCN8 network:
+You can use the following command to do inference on CPU on images captured by a camera using a pre-trained semantic-segmentation-adas-0001 network:
 ```sh
-./segmentation_demo -i <path_to_image>/inputImage.bmp -m <path_to_model>/fcn8.xml
+./segmentation_demo -i 0 -m semantic-segmentation-adas-0001.xml
 ```
 
 ## Demo Output
 
-The application outputs are a segmented image (`out.bmp`).
+The demo uses OpenCV to display the resulting images with a blended segmentation mask.
 
 > **NOTE**: On VPU devices (Intel® Movidius™ Neural Compute Stick, Intel® Neural Compute Stick 2, and Intel® Vision Accelerator Design with Intel® Movidius™ VPUs) this demo is not supported with any of the Model Downloader available topologies. Other models may produce unexpected results on these devices as well.
 
diff --git a/demos/segmentation_demo/main.cpp b/demos/segmentation_demo/main.cpp
index 973f94dbc06..794a2e3f1e5 100644
--- a/demos/segmentation_demo/main.cpp
+++ b/demos/segmentation_demo/main.cpp
@@ -2,31 +2,25 @@
 // SPDX-License-Identifier: Apache-2.0
 //
 
-#include <gflags/gflags.h>
 #include <iostream>
-#include <memory>
-#include <map>
 #include <string>
 #include <vector>
-#include <iomanip>
 
-#include <inference_engine.hpp>
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
+#include <gflags/gflags.h>
 
-#include <format_reader_ptr.h>
+#include <opencv2/videoio.hpp>
 
+#include <inference_engine.hpp>
+
+#include <monitors/presenter.h>
 #include <samples/common.hpp>
+#include <samples/ocv_common.hpp>
 #include <samples/slog.hpp>
-#include <samples/args_helper.hpp>
-
-#include <vpu/vpu_tools_common.hpp>
-#include <vpu/vpu_plugin_config.hpp>
 
 #include "segmentation_demo.h"
 
 using namespace InferenceEngine;
+typedef std::chrono::duration<double, std::chrono::milliseconds::period> Ms;
 
 bool ParseAndCheckCommandLine(int argc, char *argv[]) {
     // ---------------------------Parsing and validation of input args--------------------------------------
@@ -50,48 +44,15 @@ bool ParseAndCheckCommandLine(int argc, char *argv[]) {
     return true;
 }
 
-static std::map<std::string, std::string> configure(const std::string& confFileName) {
-    auto config = parseConfig(confFileName);
-
-    return config;
-}
-
-/**
- * @brief The entry point for inference engine deconvolution demo application
- * @file segmentation_demo/main.cpp
- * @example segmentation_demo/main.cpp
- */
 int main(int argc, char *argv[]) {
     try {
         slog::info << "InferenceEngine: " << GetInferenceEngineVersion() << slog::endl;
-
-        // ------------------------------ Parsing and validation of input args ---------------------------------
         if (!ParseAndCheckCommandLine(argc, argv)) {
             return 0;
         }
 
-        /** This vector stores paths to the processed images **/
-        std::vector<std::string> images;
-        parseInputFilesArguments(images);
-        if (images.empty()) throw std::logic_error("No suitable images were found");
-        // -----------------------------------------------------------------------------------------------------
-
-        // --------------------------- 1. Load inference engine -------------------------------------
-        slog::info << "Loading Inference Engine" << slog::endl;
         Core ie;
 
-#ifdef WITH_EXTENSIONS
-        /** Loading default extensions **/
-        if (FLAGS_d.find("CPU") != std::string::npos) {
-            /**
-             * cpu_extensions library is compiled from "extension" folder containing
-             * custom MKLDNNPlugin layer implementations. These layers are not supported
-             * by mkldnn, but they can be useful for inferring custom topologies.
-            **/
-            ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-        }
-#endif
-
         if (!FLAGS_l.empty()) {
             // CPU(MKLDNN) extensions are loaded as a shared library and passed as a pointer to base extension
             IExtensionPtr extension_ptr = make_so_pointer<IExtension>(FLAGS_l);
@@ -104,184 +65,161 @@ int main(int argc, char *argv[]) {
             slog::info << "GPU Extension loaded: " << FLAGS_c << slog::endl;
         }
 
-        /** Printing device version **/
-
         slog::info << "Device info" << slog::endl;
         std::cout << ie.GetVersions(FLAGS_d);
 
-        // -----------------------------------------------------------------------------------------------------
-
-        // --------------------------- 2. Read IR Generated by ModelOptimizer (.xml and .bin files) ------------
-        slog::info << "Loading network files" << slog::endl;
-
-        CNNNetReader networkReader;
-        /** Read network model **/
-        networkReader.ReadNetwork(FLAGS_m);
-
-        /** Extract model name and load weights **/
-        std::string binFileName = fileNameNoExt(FLAGS_m) + ".bin";
-        networkReader.ReadWeights(binFileName);
-        CNNNetwork network = networkReader.getNetwork();
-        // -----------------------------------------------------------------------------------------------------
-
-        // --------------------------- 3. Configure input & output ---------------------------------------------
-
-        // --------------------------- Prepare input blobs -----------------------------------------------------
-        slog::info << "Preparing input blobs" << slog::endl;
-
-        /** Taking information about all topology inputs **/
-        InputsDataMap inputInfo(network.getInputsInfo());
-        /** Stores all input blobs data **/
-        BlobMap inputBlobs;
-
-        if (inputInfo.size() != 1) throw std::logic_error("Demo supports topologies only with 1 input");
-        auto inputInfoItem = *inputInfo.begin();
-
-        /** Collect images data ptrs **/
-        std::vector<std::shared_ptr<unsigned char>> imagesData;
-        for (auto & i : images) {
-            FormatReader::ReaderPtr reader(i.c_str());
-            if (reader.get() == nullptr) {
-                slog::warn << "Image " + i + " cannot be read!" << slog::endl;
-                continue;
-            }
-            /** Getting image data **/
-            std::shared_ptr<unsigned char> data(reader->getData(inputInfoItem.second->getTensorDesc().getDims()[3],
-                                                                inputInfoItem.second->getTensorDesc().getDims()[2]));
-            if (data.get() != nullptr) {
-                imagesData.push_back(data);
-            }
-        }
-        if (imagesData.empty()) throw std::logic_error("Valid input images were not found!");
-
-        /** Setting batch size using image count **/
-        network.setBatchSize(imagesData.size());
-        slog::info << "Batch size is " << std::to_string(networkReader.getNetwork().getBatchSize()) << slog::endl;
-
-        inputInfoItem.second->setPrecision(Precision::U8);
-
-        // --------------------------- Prepare output blobs ----------------------------------------------------
-        slog::info << "Preparing output blobs" << slog::endl;
-
-        OutputsDataMap outputInfo(network.getOutputsInfo());
-        // BlobMap outputBlobs;
-        std::string firstOutputName;
-
-        for (auto & item : outputInfo) {
-            if (firstOutputName.empty()) {
-                firstOutputName = item.first;
-            }
-            DataPtr outputData = item.second;
-            if (!outputData) {
-                throw std::logic_error("output data pointer is not valid");
-            }
-
-            item.second->setPrecision(Precision::FP32);
+        CNNNetwork network = ie.ReadNetwork(FLAGS_m);
+
+        ICNNNetwork::InputShapes inputShapes = network.getInputShapes();
+        if (inputShapes.size() != 1)
+            throw std::runtime_error("Demo supports topologies only with 1 input");
+        const std::string& inName = inputShapes.begin()->first;
+        SizeVector& inSizeVector = inputShapes.begin()->second;
+        if (inSizeVector.size() != 4 || inSizeVector[1] != 3)
+            throw std::runtime_error("3-channel 4-dimensional model's input is expected");
+        inSizeVector[0] = 1;  // set batch size to 1
+        network.reshape(inputShapes);
+
+        InputInfo& inputInfo = *network.getInputsInfo().begin()->second;
+        inputInfo.getPreProcess().setResizeAlgorithm(ResizeAlgorithm::RESIZE_BILINEAR);
+        inputInfo.setLayout(Layout::NHWC);
+        inputInfo.setPrecision(Precision::U8);
+
+        const OutputsDataMap& outputsDataMap = network.getOutputsInfo();
+        if (outputsDataMap.size() != 1) throw std::runtime_error("Demo supports topologies only with 1 output");
+        const std::string& outName = outputsDataMap.begin()->first;
+        Data& data = *outputsDataMap.begin()->second;
+        // if the model performs ArgMax, its output type can be I32 but for models that return heatmaps for each
+        // class the output is usually FP32. Reset the precision to avoid handling different types with switch in
+        // postprocessing
+        data.setPrecision(Precision::FP32);
+        const SizeVector& outSizeVector = data.getTensorDesc().getDims();
+        int outChannels, outHeight, outWidth;
+        switch(outSizeVector.size()) {
+            case 3:  // dims read as (_, height, width): no channel axis
+                outChannels = 0;
+                outHeight = outSizeVector[1];
+                outWidth = outSizeVector[2];
+                break;
+            case 4:  // dims read as (_, channels, height, width)
+                outChannels = outSizeVector[1];
+                outHeight = outSizeVector[2];
+                outWidth = outSizeVector[3];
+                break;
+            default:
+                throw std::runtime_error("Unexpected output blob shape. Only 4D and 3D output blobs are "
+                    "supported.");
         }
-        // -----------------------------------------------------------------------------------------------------
-
-        // --------------------------- 4. Loading model to the device ------------------------------------------
-        slog::info << "Loading model to the device" << slog::endl;
-        ExecutableNetwork executable_network = ie.LoadNetwork(network, FLAGS_d, configure(FLAGS_config));
-        // -----------------------------------------------------------------------------------------------------
-
-        // --------------------------- 5. Create infer request -------------------------------------------------
-        slog::info << "Create infer request" << slog::endl;
-        InferRequest infer_request = executable_network.CreateInferRequest();
-        // -----------------------------------------------------------------------------------------------------
-
-        // --------------------------- 6. Prepare input --------------------------------------------------------
-        /** Iterate over all the input blobs **/
-        /** Iterating over all input blobs **/
-        for (const auto & item : inputInfo) {
-            /** Creating input blob **/
-            Blob::Ptr input = infer_request.GetBlob(item.first);
-
-            /** Fill input tensor with images. First r channel, then g and b channels **/
-            size_t num_channels = input->getTensorDesc().getDims()[1];
-            size_t image_size = input->getTensorDesc().getDims()[3] * input->getTensorDesc().getDims()[2];
-
-            auto data = input->buffer().as<PrecisionTrait<Precision::U8>::value_type*>();
 
-            /** Iterate over all input images **/
-            for (size_t image_id = 0; image_id < imagesData.size(); ++image_id) {
-                /** Iterate over all pixel in image (r,g,b) **/
-                for (size_t pid = 0; pid < image_size; pid++) {
-                    /** Iterate over all channels **/
-                    for (size_t ch = 0; ch < num_channels; ++ch) {
-                        /**          [images stride + channels stride + pixel id ] all in bytes            **/
-                        data[image_id * image_size * num_channels + ch * image_size + pid] = imagesData.at(image_id).get()[pid*num_channels + ch];
-                    }
-                }
-            }
+        ExecutableNetwork executableNetwork = ie.LoadNetwork(network, FLAGS_d);
+        InferRequest inferRequest = executableNetwork.CreateInferRequest();
+
+        cv::VideoCapture cap;
+        try {
+            int index = std::stoi(FLAGS_i);
+            if (!cap.open(index))
+                throw std::runtime_error("Can't open camera " + std::to_string(index));
+        } catch (const std::invalid_argument&) {
+            if (!cap.open(FLAGS_i))
+                throw std::runtime_error("Can't open input " + FLAGS_i);
+        } catch (const std::out_of_range&) {
+            if (!cap.open(FLAGS_i))
+                throw std::runtime_error("Can't open input " + FLAGS_i);
         }
-        // -----------------------------------------------------------------------------------------------------
-
-        // --------------------------- 7. Do inference ---------------------------------------------------------
-        slog::info << "Start inference" << slog::endl;
-        infer_request.Infer();
-        // -----------------------------------------------------------------------------------------------------
-
-        // --------------------------- 8. Process output -------------------------------------------------------
-        slog::info << "Processing output blobs" << slog::endl;
-
-        const Blob::Ptr output_blob = infer_request.GetBlob(firstOutputName);
-        const auto output_data = output_blob->buffer().as<float*>();
 
-        size_t N = output_blob->getTensorDesc().getDims().at(0);
-        size_t C, H, W;
-
-        size_t output_blob_shape_size = output_blob->getTensorDesc().getDims().size();
-        slog::info << "Output blob has " << output_blob_shape_size << " dimensions" << slog::endl;
-
-        if (output_blob_shape_size == 3) {
-            C = 1;
-            H = output_blob->getTensorDesc().getDims().at(1);
-            W = output_blob->getTensorDesc().getDims().at(2);
-        } else if (output_blob_shape_size == 4) {
-            C = output_blob->getTensorDesc().getDims().at(1);
-            H = output_blob->getTensorDesc().getDims().at(2);
-            W = output_blob->getTensorDesc().getDims().at(3);
-        } else {
-            throw std::logic_error("Unexpected output blob shape. Only 4D and 3D output blobs are supported.");
+        float blending = 0.3f;
+        constexpr char WIN_NAME[] = "segmentation";
+        int blendingPercent = static_cast<int>(blending * 100);  // trackbar keeps this pointer: must outlive the loop
+        if (!FLAGS_no_show) {
+            cv::namedWindow(WIN_NAME);
+            cv::createTrackbar("blending", WIN_NAME, &blendingPercent, 100,
+                [](int position, void* blendingPtr){*static_cast<float*>(blendingPtr) = position * 0.01f;},
+                &blending);
         }
 
-        size_t image_stride = W*H*C;
-
-        /** Iterating over all images **/
-        for (size_t image = 0; image < N; ++image) {
-            /** This vector stores pixels classes **/
-            std::vector<std::vector<size_t>> outArrayClasses(H, std::vector<size_t>(W, 0));
-            std::vector<std::vector<float>> outArrayProb(H, std::vector<float>(W, 0.));
-            /** Iterating over each pixel **/
-            for (size_t w = 0; w < W; ++w) {
-                for (size_t h = 0; h < H; ++h) {
-                    /* number of channels = 1 means that the output is already ArgMax'ed */
-                    if (C == 1) {
-                        outArrayClasses[h][w] = static_cast<size_t>(output_data[image_stride * image + W * h + w]);
+        cv::Mat inImg, resImg, maskImg(outHeight, outWidth, CV_8UC3);
+        std::vector<cv::Vec3b> colors(arraySize(CITYSCAPES_COLORS));
+        for (std::size_t i = 0; i < colors.size(); ++i)
+            colors[i] = {CITYSCAPES_COLORS[i].blue(), CITYSCAPES_COLORS[i].green(), CITYSCAPES_COLORS[i].red()};
+        std::mt19937 rng;
+        std::uniform_int_distribution<int> distr(0, 255);
+        int delay = FLAGS_delay;
+        cv::Size graphSize{static_cast<int>(cap.get(cv::CAP_PROP_FRAME_WIDTH) / 4), 60};
+        Presenter presenter(FLAGS_u, 10, graphSize);
+
+        std::chrono::steady_clock::duration latencySum{0};
+        unsigned latencySamplesNum = 0;
+        std::ostringstream latencyStream;
+
+        std::chrono::steady_clock::time_point t0 = std::chrono::steady_clock::now();
+        while (cap.read(inImg) && delay >= 0) {
+            if (CV_8UC3 != inImg.type())
+                throw std::runtime_error("BGR (or RGB) image expected to come from input");
+            inferRequest.SetBlob(inName, wrapMat2Blob(inImg));
+            inferRequest.Infer();
+
+            const float * const predictions = inferRequest.GetBlob(outName)->cbuffer().as<float*>();
+            for (int rowId = 0; rowId < outHeight; ++rowId) {
+                for (int colId = 0; colId < outWidth; ++colId) {
+                    std::size_t classId = 0;
+                    if (outChannels < 2) {  // 3D or single-channel 4D output: assume it is already ArgMax'ed
+                        classId = static_cast<std::size_t>(predictions[rowId * outWidth + colId]);
                     } else {
-                        /** Iterating over each class probability **/
-                        for (size_t ch = 0; ch < C; ++ch) {
-                            auto data = output_data[image_stride * image + W * H * ch + W * h + w];
-                            if (data > outArrayProb[h][w]) {
-                                outArrayClasses[h][w] = ch;
-                                outArrayProb[h][w] = data;
+                        float maxProb = predictions[rowId * outWidth + colId];  // seed with channel 0 (classId == 0)
+                        for (int chId = 1; chId < outChannels; ++chId) {
+                            float prob = predictions[chId * outHeight * outWidth + rowId * outWidth + colId];
+                            if (prob > maxProb) {
+                                classId = chId;
+                                maxProb = prob;
                             }
                         }
                     }
+                    while (classId >= colors.size()) {
+                        cv::Vec3b color(distr(rng), distr(rng), distr(rng));
+                        colors.push_back(color);
+                    }
+                    maskImg.at<cv::Vec3b>(rowId, colId) = colors[classId];
                 }
             }
-            /** Dump resulting image **/
-            std::string fileName = "out_" + std::to_string(image) + ".bmp";
-            std::ofstream outFile(fileName, std::ofstream::binary);
-            if (!outFile.is_open()) {
-                throw std::logic_error("Can't open file : " + fileName);
+            cv::resize(maskImg, resImg, inImg.size());
+            resImg = inImg * blending + resImg * (1 - blending);
+            presenter.drawGraphs(resImg);
+
+            latencySum += std::chrono::steady_clock::now() - t0;
+            ++latencySamplesNum;
+            latencyStream.str("");
+            latencyStream << std::fixed << std::setprecision(1)
+                << (std::chrono::duration_cast<Ms>(latencySum) / latencySamplesNum).count() << " ms";
+            constexpr int FONT_FACE = cv::FONT_HERSHEY_SIMPLEX;
+            constexpr double FONT_SCALE = 2;
+            constexpr int THICKNESS = 2;
+            int baseLine;
+            cv::getTextSize(latencyStream.str(), FONT_FACE, FONT_SCALE, THICKNESS, &baseLine);
+            cv::putText(resImg, latencyStream.str(), cv::Size{0, resImg.rows - baseLine}, FONT_FACE, FONT_SCALE,
+                cv::Scalar{255, 0, 0}, THICKNESS);
+
+            if (!FLAGS_no_show) {
+                cv::imshow(WIN_NAME, resImg);
+                int key = cv::waitKey(delay);
+                switch(key) {
+                    case 'q':
+                    case 'Q':
+                    case 27: // Esc
+                        delay = -1;
+                        break;
+                    case 'p':
+                    case 'P':
+                    case 32: // Space
+                        delay = !delay * (FLAGS_delay + !FLAGS_delay);
+                        break;
+                    default:
+                        presenter.handleKey(key);
+                }
             }
-
-            writeOutputBmp(outArrayClasses, C, outFile);
-            slog::info << "File : " << fileName << " was created" << slog::endl;
+            t0 = std::chrono::steady_clock::now();
         }
-        // -----------------------------------------------------------------------------------------------------
+        std::cout << "Mean pipeline latency: " << latencyStream.str() << '\n';
+        std::cout << presenter.reportMeans() << '\n';
     }
     catch (const std::exception& error) {
         slog::err << error.what() << slog::endl;
@@ -293,7 +231,5 @@ int main(int argc, char *argv[]) {
     }
 
     slog::info << "Execution successful" << slog::endl;
-    slog::info << slog::endl << "This demo is an API example, for any performance measurements "
-                                "please use the dedicated benchmark_app tool from the openVINO toolkit" << slog::endl;
     return 0;
 }
diff --git a/demos/segmentation_demo/models.lst b/demos/segmentation_demo/models.lst
index a6975de59eb..b695bc84a77 100644
--- a/demos/segmentation_demo/models.lst
+++ b/demos/segmentation_demo/models.lst
@@ -1,3 +1,4 @@
 # This file can be used with the --list option of the model downloader.
+deeplabv3
 road-segmentation-adas-????
 semantic-segmentation-adas-????
diff --git a/demos/segmentation_demo/segmentation_demo.h b/demos/segmentation_demo/segmentation_demo.h
index 0a1848f92bc..39fec9e3ffb 100644
--- a/demos/segmentation_demo/segmentation_demo.h
+++ b/demos/segmentation_demo/segmentation_demo.h
@@ -9,70 +9,47 @@
 #include <gflags/gflags.h>
 #include <iostream>
 
-/// @brief message for help argument
 static const char help_message[] = "Print a usage message.";
+static const char input_message[] = "Required. Input to process.";
+static const char model_message[] = "Required. Path to an .xml file with a trained model.";
+static const char target_device_message[] = "Optional. Specify the target device to infer on (the list of available devices is shown below). "
+                                            "Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
+                                            "The demo will look for a suitable plugin for a specified device.";
+static const char custom_cldnn_message[] = "Required for GPU custom kernels. "
+                                           "Absolute path to the .xml file with the kernels descriptions.";
+static const char custom_cpu_library_message[] = "Required for CPU custom layers. "
+                                                 "Absolute path to a shared library with the kernels implementations.";
+static const char config_message[] = "Path to the configuration file. Default value: \"config\".";
+static const char delay_message[] = "Optional. Default is 1. Interval in milliseconds of waiting for a key to be "
+                                    "pressed. For a negative value the demo loads a model, opens an input and "
+                                    "exits.";
+static const char no_show_message[] = "Optional. Do not visualize inference results.";
+static const char utilization_monitors_message[] = "Optional. List of monitors to show initially.";
 
-/// @brief message for images argument
-static const char image_message[] = "Required. Path to an .bmp image.";
-
-/// @brief message for model argument
-static const char model_message[] = "Required. Path to an .xml file with a trained model.";\
-
-/// @brief message for assigning cnn calculation to device
-static const char target_device_message[] = "Optional. Specify the target device to infer on (the list of available devices is shown below). " \
-"Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
-"The demo will look for a suitable plugin for a specified device.";
-
-/// @brief message for clDNN custom kernels desc
-static const char custom_cldnn_message[] = "Required for GPU custom kernels. "\
-"Absolute path to the .xml file with the kernels descriptions.";
-
-/// @brief message for user library argument
-static const char custom_cpu_library_message[] = "Required for CPU custom layers. " \
-"Absolute path to a shared library with the kernels implementations.";
-
-/// @brief message for config argument
-static constexpr char config_message[] = "Path to the configuration file. Default value: \"config\".";
-
-/// @brief Define parameter for clDNN custom kernels path <br>
-/// Default is ./lib
 DEFINE_string(c, "", custom_cldnn_message);
-
-/// @brief Absolute path to CPU library with user layers <br>
-/// It is a optional parameter
 DEFINE_string(l, "", custom_cpu_library_message);
-
-/// @brief Define flag for showing help message <br>
 DEFINE_bool(h, false, help_message);
-
-/// @brief Define parameter for set image file <br>
-/// It is a required parameter
-DEFINE_string(i, "", image_message);
-
-/// @brief Define parameter for set model file <br>
-/// It is a required parameter
+DEFINE_string(i, "", input_message);
 DEFINE_string(m, "", model_message);
-
-/// @brief device the target device to infer on <br>
 DEFINE_string(d, "CPU", target_device_message);
-
-/// @brief Define path to plugin config
 DEFINE_string(config, "", config_message);
+DEFINE_int32(delay, 1, delay_message);
+DEFINE_bool(no_show, false, no_show_message);
+DEFINE_string(u, "", utilization_monitors_message);
 
-
-/**
-* @brief This function show a help message
-*/
 static void showUsage() {
     std::cout << std::endl;
     std::cout << "segmentation_demo [OPTION]" << std::endl;
     std::cout << "Options:" << std::endl;
     std::cout << std::endl;
     std::cout << "    -h                        " << help_message << std::endl;
-    std::cout << "    -i \"<path>\"               " << image_message << std::endl;
+    std::cout << "    -i \"<path>\"               " << input_message << std::endl;
     std::cout << "    -m \"<path>\"               " << model_message << std::endl;
     std::cout << "      -l \"<absolute_path>\"    " << custom_cpu_library_message << std::endl;
     std::cout << "          Or" << std::endl;
     std::cout << "      -c \"<absolute_path>\"    " << custom_cldnn_message << std::endl;
     std::cout << "    -d \"<device>\"             " << target_device_message << std::endl;
+    std::cout << "    -delay                    " << delay_message << std::endl;
+    std::cout << "    -no_show                  " << no_show_message << std::endl;
+    std::cout << "    -u                        " << utilization_monitors_message << std::endl;
 }
diff --git a/demos/smart_classroom_demo/CMakeLists.txt b/demos/smart_classroom_demo/CMakeLists.txt
index a8d7168991d..00061a20ef5 100644
--- a/demos/smart_classroom_demo/CMakeLists.txt
+++ b/demos/smart_classroom_demo/CMakeLists.txt
@@ -9,5 +9,5 @@ ie_add_sample(NAME smart_classroom_demo
               SOURCES ${SOURCES}
               HEADERS ${HEADERS}
               INCLUDE_DIRECTORIES "${CMAKE_CURRENT_SOURCE_DIR}/include"
-              DEPENDENCIES format_reader
+              DEPENDENCIES monitors
               OPENCV_DEPENDENCIES highgui)
diff --git a/demos/smart_classroom_demo/README.md b/demos/smart_classroom_demo/README.md
index 8a1c2e94c5f..38282419def 100644
--- a/demos/smart_classroom_demo/README.md
+++ b/demos/smart_classroom_demo/README.md
@@ -29,7 +29,7 @@ To recognize faces on a frame, the demo needs a gallery of reference images. Eac
 ## Running
 
 Running the application with the `-h` option yields the following usage message:
-```sh
+```
 ./smart_classroom_demo -h
 InferenceEngine:
     API version ............ <version>
@@ -52,6 +52,7 @@ Options:
     -d_lm '<device>'               Optional. Specify the target device for Landmarks Regression Retail (the list of available devices is shown below). Default value is CPU. Use "-d HETERO:<comma-separated_devices_list>" format to specify HETERO plugin. The application looks for a suitable plugin for the specified device.
     -d_reid '<device>'             Optional. Specify the target device for Face Reidentification Retail (the list of available devices is shown below). Default value is CPU. Use "-d HETERO:<comma-separated_devices_list>" format to specify HETERO plugin. The application looks for a suitable plugin for the specified device.
     -out_v  '<path>'               Optional. File to write output video with visualization to.
+    -greedy_reid_matching          Optional. Use faster greedy matching algorithm in face reid.
     -pc                            Optional. Enables per-layer performance statistics.
     -r                             Optional. Output Inference results as raw values.
     -ad                            Optional. Output file name to save per-person action statistics in.
@@ -77,6 +78,7 @@ Options:
     -min_size_fr                   Optional. Minimum input size for faces during database registration.
     -al                            Optional. Output file name to save per-person action detections in.
     -ss_t                          Optional. Number of frames to smooth actions.
+    -u                             Optional. List of monitors to show initially.
 ```
 
 Running the application with the empty list of options yields an error message.
diff --git a/demos/smart_classroom_demo/create_list.py b/demos/smart_classroom_demo/create_list.py
index 93d5a8df00a..5ed3228909d 100755
--- a/demos/smart_classroom_demo/create_list.py
+++ b/demos/smart_classroom_demo/create_list.py
@@ -41,4 +41,4 @@
         objects[label] = [path]
 
 with open('faces_gallery.json', 'w') as outfile:
-    json.dump(objects, outfile)
+    json.dump(objects, outfile, indent=4)
diff --git a/demos/smart_classroom_demo/include/action_detector.hpp b/demos/smart_classroom_demo/include/action_detector.hpp
index e50337301c0..c14e49d31e5 100644
--- a/demos/smart_classroom_demo/include/action_detector.hpp
+++ b/demos/smart_classroom_demo/include/action_detector.hpp
@@ -55,9 +55,9 @@ using SSDHeads = std::vector<SSDHead>;
 * @brief Config for the Action Detection model
 */
 struct ActionDetectorConfig : public CnnConfig {
-    explicit ActionDetectorConfig(const std::string& path_to_model,
-                                  const std::string& path_to_weights)
-        : CnnConfig(path_to_model, path_to_weights) {}
+    explicit ActionDetectorConfig(const std::string& path_to_model)
+        : CnnConfig(path_to_model) {}
+
     /** @brief Name of output blob with location info */
     std::string old_loc_blob_name{"mbox_loc1/out/conv/flat"};
     /** @brief Name of output blob with detection confidence info */
@@ -95,7 +95,7 @@ struct ActionDetectorConfig : public CnnConfig {
     /** @brief Number of SSD anchors for the new network version */
     std::vector<int> new_anchors{1, 4};
     /** @brief Number of actions to detect */
-    int num_action_classes = 3;
+    size_t num_action_classes = 3;
     /** @brief Async execution flag */
     bool is_async = true;
     /** @brief  SSD bbox encoding variances */
@@ -108,14 +108,17 @@ struct ActionDetectorConfig : public CnnConfig {
 };
 
 
-class ActionDetection : public BaseCnnDetection {
+class ActionDetection : public AsyncDetection<DetectedAction>, public BaseCnnDetection {
 public:
     explicit ActionDetection(const ActionDetectorConfig& config);
 
-    DetectedActions results;
     void submitRequest() override;
-    void enqueue(const cv::Mat &frame);
-    void fetchResults();
+    void enqueue(const cv::Mat &frame) override;
+    void wait() override { BaseCnnDetection::wait(); }
+    void printPerformanceCounts(const std::string &fullDeviceName) override {
+        BaseCnnDetection::printPerformanceCounts(fullDeviceName);
+    }
+    DetectedActions fetchResults() override;
 
 private:
     ActionDetectorConfig config_;
@@ -126,7 +129,6 @@ class ActionDetection : public BaseCnnDetection {
     int enqueued_frames_ = 0;
     float width_ = 0;
     float height_ = 0;
-    bool results_fetched_ = false;
     bool new_network_ = false;
     std::vector<int> head_ranges_;
     std::vector<int> head_step_sizes_;
@@ -157,14 +159,13 @@ class ActionDetection : public BaseCnnDetection {
     * @param add_conf Action conf buffer
     * @param priorboxes Priorboxes buffer
     * @param frame_size Size of input image (WxH)
-    * @param detections Detected objects
+    * @return Detected objects
     */
-    void GetDetections(const cv::Mat& loc,
-                       const cv::Mat& main_conf,
-                       const cv::Mat& priorboxes,
-                       const std::vector<cv::Mat>& add_conf,
-                       const cv::Size& frame_size,
-                       DetectedActions* detections) const;
+    DetectedActions GetDetections(const cv::Mat& loc,
+                                  const cv::Mat& main_conf,
+                                  const cv::Mat& priorboxes,
+                                  const std::vector<cv::Mat>& add_conf,
+                                  const cv::Size& frame_size) const;
 
      /**
     * @brief Translate input buffer to BBox
diff --git a/demos/smart_classroom_demo/include/cnn.hpp b/demos/smart_classroom_demo/include/cnn.hpp
index d60e87d7e47..8d563f355e8 100644
--- a/demos/smart_classroom_demo/include/cnn.hpp
+++ b/demos/smart_classroom_demo/include/cnn.hpp
@@ -18,18 +18,13 @@
 * @brief Base class of config for network
 */
 struct CnnConfig {
-    explicit CnnConfig(const std::string& path_to_model,
-                       const std::string& path_to_weights)
-        : path_to_model(path_to_model), path_to_weights(path_to_weights) {}
+    explicit CnnConfig(const std::string& path_to_model)
+        : path_to_model(path_to_model) {}
 
     /** @brief Path to model description */
     std::string path_to_model;
-    /** @brief Path to model weights */
-    std::string path_to_weights;
     /** @brief Maximal size of batch */
     int max_batch_size{1};
-    /** @brief Enabled/disabled status */
-    bool enabled{true};
 
     /** @brief Inference Engine */
     InferenceEngine::Core ie;
@@ -64,11 +59,6 @@ class CnnDLSDKBase {
     */
     void PrintPerformanceCounts(std::string fullDeviceName) const;
 
-    /**
-    * @brief Indicates whether model enabled or not
-    */
-    bool Enabled() const;
-
 protected:
     /**
    * @brief Run network
@@ -77,7 +67,7 @@ class CnnDLSDKBase {
    * @param results_fetcher Callback to fetch inference results
    */
     void Infer(const cv::Mat& frame,
-               std::function<void(const InferenceEngine::BlobMap&, size_t)> results_fetcher) const;
+               const std::function<void(const InferenceEngine::BlobMap&, size_t)>& results_fetcher) const;
 
     /**
    * @brief Run network in batch mode
@@ -86,7 +76,7 @@ class CnnDLSDKBase {
    * @param results_fetcher Callback to fetch inference results
    */
     void InferBatch(const std::vector<cv::Mat>& frames,
-                    std::function<void(const InferenceEngine::BlobMap&, size_t)> results_fetcher) const;
+                    const std::function<void(const InferenceEngine::BlobMap&, size_t)>& results_fetcher) const;
 
     /** @brief Config */
     Config config_;
@@ -114,21 +104,43 @@ class VectorCNN : public CnnDLSDKBase {
                  std::vector<cv::Mat>* vectors, cv::Size outp_shape = cv::Size()) const;
 };
 
-class BaseCnnDetection {
+class AsyncAlgorithm {
+public:
+    virtual ~AsyncAlgorithm() {}
+    virtual void enqueue(const cv::Mat &frame) = 0;
+    virtual void submitRequest() = 0;
+    virtual void wait() = 0;
+    virtual void printPerformanceCounts(const std::string &fullDeviceName) = 0;
+};
+
+template <typename T>
+class AsyncDetection : public AsyncAlgorithm {
+public:
+    virtual std::vector<T> fetchResults() = 0;
+};
+
+template <typename T>
+class NullDetection : public AsyncDetection<T> {
+public:
+    void enqueue(const cv::Mat &) override {}
+    void submitRequest() override {}
+    void wait() override {}
+    void printPerformanceCounts(const std::string &) override {}
+    std::vector<T> fetchResults() override { return {}; }
+};
+
+class BaseCnnDetection : public AsyncAlgorithm {
 protected:
     InferenceEngine::InferRequest::Ptr request;
     const bool isAsync;
-    const bool enabledFlag;
     std::string topoName;
 
 public:
-    explicit BaseCnnDetection(bool enabled = true, bool isAsync = false) :
-                              isAsync(isAsync), enabledFlag(enabled) {}
+    explicit BaseCnnDetection(bool isAsync = false) :
+                              isAsync(isAsync) {}
 
-    virtual ~BaseCnnDetection() {}
-
-    virtual void submitRequest() {
-        if (!enabled() || request == nullptr) return;
+    void submitRequest() override {
+        if (request == nullptr) return;
         if (isAsync) {
             request->StartAsync();
         } else {
@@ -136,19 +148,12 @@ class BaseCnnDetection {
         }
     }
 
-    virtual void wait() {
-        if (!enabled()|| !request || !isAsync) return;
+    void wait() override {
+        if (!request || !isAsync) return;
         request->Wait(InferenceEngine::IInferRequest::WaitMode::RESULT_READY);
     }
 
-    bool enabled() const  {
-        return enabledFlag;
-    }
-
-    void PrintPerformanceCounts(std::string fullDeviceName) {
-        if (!enabled()) {
-            return;
-        }
+    void printPerformanceCounts(const std::string &fullDeviceName) override {
         std::cout << "Performance counts for " << topoName << std::endl << std::endl;
         ::printPerformanceCounts(*request, std::cout, fullDeviceName, false);
     }
diff --git a/demos/smart_classroom_demo/include/detector.hpp b/demos/smart_classroom_demo/include/detector.hpp
index a75e54ce857..6dc6949266c 100644
--- a/demos/smart_classroom_demo/include/detector.hpp
+++ b/demos/smart_classroom_demo/include/detector.hpp
@@ -25,9 +25,8 @@ struct DetectedObject {
 using DetectedObjects = std::vector<DetectedObject>;
 
 struct DetectorConfig : public CnnConfig {
-    explicit DetectorConfig(const std::string& path_to_model,
-                            const std::string& path_to_weights)
-        : CnnConfig(path_to_model, path_to_weights) {}
+    explicit DetectorConfig(const std::string& path_to_model)
+        : CnnConfig(path_to_model) {}
 
     float confidence_threshold{0.6f};
     float increase_scale_x{1.15f};
@@ -37,7 +36,7 @@ struct DetectorConfig : public CnnConfig {
     int input_w = 600;
 };
 
-class FaceDetection : public BaseCnnDetection {
+class FaceDetection : public AsyncDetection<DetectedObject>, public BaseCnnDetection {
 private:
     DetectorConfig config_;
     InferenceEngine::ExecutableNetwork net_;
@@ -48,15 +47,18 @@ class FaceDetection : public BaseCnnDetection {
     int enqueued_frames_ = 0;
     float width_ = 0;
     float height_ = 0;
-    bool results_fetched_ = false;
 
 public:
     explicit FaceDetection(const DetectorConfig& config);
 
-    DetectedObjects results;
     void submitRequest() override;
-    void enqueue(const cv::Mat &frame);
-    void fetchResults();
+    void enqueue(const cv::Mat &frame) override;
+    void wait() override { BaseCnnDetection::wait(); }
+    void printPerformanceCounts(const std::string &fullDeviceName) override {
+        BaseCnnDetection::printPerformanceCounts(fullDeviceName);
+    }
+
+    DetectedObjects fetchResults() override;
 };
 
 }  // namespace detection
diff --git a/demos/smart_classroom_demo/include/face_reid.hpp b/demos/smart_classroom_demo/include/face_reid.hpp
index c89ac0fcc79..c0a358d05f2 100644
--- a/demos/smart_classroom_demo/include/face_reid.hpp
+++ b/demos/smart_classroom_demo/include/face_reid.hpp
@@ -34,9 +34,10 @@ class EmbeddingsGallery {
     static const char unknown_label[];
     static const int unknown_id;
     EmbeddingsGallery(const std::string& ids_list, double threshold, int min_size_fr,
-                      bool crop_gallery, detection::FaceDetection& detector,
+                      bool crop_gallery, const detection::DetectorConfig &detector_config,
                       const VectorCNN& landmarks_det,
-                      const VectorCNN& image_reid);
+                      const VectorCNN& image_reid,
+                      bool use_greedy_matcher=false);
     size_t size() const;
     std::vector<int> GetIDsByEmbeddings(const std::vector<cv::Mat>& embeddings) const;
     std::string GetLabelByID(int id) const;
@@ -55,6 +56,7 @@ class EmbeddingsGallery {
     std::vector<int> idx_to_id;
     double reid_threshold;
     std::vector<GalleryObject> identities;
+    bool use_greedy_matcher;
 };
 
 void AlignFaces(std::vector<cv::Mat>* face_images,
diff --git a/demos/smart_classroom_demo/include/image_grabber.hpp b/demos/smart_classroom_demo/include/image_grabber.hpp
index c8809b3249f..b83b5b6cc77 100644
--- a/demos/smart_classroom_demo/include/image_grabber.hpp
+++ b/demos/smart_classroom_demo/include/image_grabber.hpp
@@ -14,7 +14,6 @@ class ImageGrabber {
     bool GrabNext();
     bool Retrieve(cv::Mat& img);
     bool IsOpened() const;
-    int GetFrameIndex() const;
     int GetFPS() const;
     std::string GetVideoPath() const;
 
@@ -27,7 +26,4 @@ class ImageGrabber {
     std::vector<std::vector<int>> frames;
     int current_video_idx;
     int current_frame_idx;
-    int cap_frame_index;
-
-    bool NextVideo();
 };
diff --git a/demos/smart_classroom_demo/include/smart_classroom_demo.hpp b/demos/smart_classroom_demo/include/smart_classroom_demo.hpp
index 37a717eaf1a..80fd7c3ac40 100644
--- a/demos/smart_classroom_demo/include/smart_classroom_demo.hpp
+++ b/demos/smart_classroom_demo/include/smart_classroom_demo.hpp
@@ -9,281 +9,104 @@
 #include <vector>
 #include <gflags/gflags.h>
 
-/// @brief Message for help argument
 static const char help_message[] = "Print a usage message.";
-
-/// @brief Message for images argument
 static const char video_message[] = "Required. Path to a video or image file. Default value is \"cam\" to work with camera.";
-
-/// @brief Message for model argument
 static const char person_action_detection_model_message[] = "Required. Path to the Person/Action Detection Retail model (.xml) file.";
 static const char face_detection_model_message[] = "Required. Path to the Face Detection Retail model (.xml) file.";
 static const char facial_landmarks_model_message[] = "Required. Path to the Facial Landmarks Regression Retail model (.xml) file.";
 static const char face_reid_model_message[] = "Required. Path to the Face Reidentification Retail model (.xml) file.";
-
-/// @brief Message for assigning Person/Action detection inference to device
-static const char target_device_message_action_detection[] = "Optional. Specify the target device for Person/Action Detection Retail "\
-                                                             "(the list of available devices is shown below).Default value is CPU. " \
-                                                             "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
+static const char target_device_message_action_detection[] = "Optional. Specify the target device for Person/Action Detection Retail "
+                                                             "(the list of available devices is shown below). Default value is CPU. "
+                                                             "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
                                                              "The application looks for a suitable plugin for the specified device.";
-
-/// @brief Message for assigning Face Detection inference to device
-static const char target_device_message_face_detection[] = "Optional. Specify the target device for Face Detection Retail "\
-                                                           "(the list of available devices is shown below).Default value is CPU. " \
-                                                           "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
+static const char target_device_message_face_detection[] = "Optional. Specify the target device for Face Detection Retail "
+                                                           "(the list of available devices is shown below). Default value is CPU. "
+                                                           "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
                                                            "The application looks for a suitable plugin for the specified device.";
-
-/// @brief Message for assigning Landmarks Regression retail inference to device
-static const char target_device_message_landmarks_regression[] = "Optional. Specify the target device for Landmarks Regression Retail "\
-                                                                 "(the list of available devices is shown below).Default value is CPU. " \
-                                                                 "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
+static const char target_device_message_landmarks_regression[] = "Optional. Specify the target device for Landmarks Regression Retail "
+                                                                 "(the list of available devices is shown below). Default value is CPU. "
+                                                                 "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
                                                                  "The application looks for a suitable plugin for the specified device.";
-
-/// @brief Message for assigning Face Reidentification retail inference to device
-static const char target_device_message_face_reid[] = "Optional. Specify the target device for Face Reidentification Retail "\
-                                                      "(the list of available devices is shown below).Default value is CPU. " \
-                                                      "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
+static const char target_device_message_face_reid[] = "Optional. Specify the target device for Face Reidentification Retail "
+                                                      "(the list of available devices is shown below). Default value is CPU. "
+                                                      "Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
                                                       "The application looks for a suitable plugin for the specified device.";
-
-/// @brief Message for performance counters
+static const char greedy_reid_matching_message[] = "Optional. Use faster greedy matching algorithm in face reid.";
 static const char performance_counter_message[] = "Optional. Enables per-layer performance statistics.";
-
-/// @brief Message for clDNN custom kernels desc
-static const char custom_cldnn_message[] = "Optional. For GPU custom kernels, if any. "\
-"Absolute path to an .xml file with the kernels description.";
-
-/// @brief Message for user library argument
-static const char custom_cpu_library_message[] = "Optional. For CPU custom layers, if any. " \
-"Absolute path to a shared library with the kernels implementation.";
-
-/// @brief Message for probability threshold argument for face detections
+static const char custom_cldnn_message[] = "Optional. For GPU custom kernels, if any. "
+                                           "Absolute path to an .xml file with the kernels description.";
+static const char custom_cpu_library_message[] = "Optional. For CPU custom layers, if any. "
+                                                 "Absolute path to a shared library with the kernels implementation.";
 static const char face_threshold_output_message[] = "Optional. Probability threshold for face detections.";
-
-/// @brief Message for probability threshold argument for person/action detection
 static const char person_threshold_output_message[] = "Optional. Probability threshold for person/action detection.";
-
-// @brief Message for probability threshold argument for action recognition
 static const char action_threshold_output_message[] = "Optional. Probability threshold for action recognition.";
-
-/// @brief Message for cosine distance threshold for face reidentification
 static const char threshold_output_message_face_reid[] = "Optional. Cosine distance threshold between two vectors for face reidentification.";
-
-/// @brief Message for faces gallery path
 static const char reid_gallery_path_message[] = "Optional. Path to a faces gallery in .json format.";
-
-/// @brief Message for output video path
 static const char output_video_message[] = "Optional. File to write output video with visualization to.";
-
-/// @brief Message action statistics output flag
 static const char act_stat_output_message[] = "Optional. Output file name to save per-person action statistics in.";
-
-/// @brief Message raw output flag
 static const char raw_output_message[] = "Optional. Output Inference results as raw values.";
-
-/// @brief Message no show processed video
 static const char no_show_processed_video[] = "Optional. Do not show processed video.";
-
-/// @brief Message input image height for face detector
 static const char input_image_height_output_message[] = "Optional. Input image height for face detector.";
-
-/// @brief Message input image width for face detector
 static const char input_image_width_output_message[] = "Optional. Input image width for face detector.";
-
-/// @brief Message expand ratio for bbox
 static const char expand_ratio_output_message[] = "Optional. Expand ratio for bbox before face recognition.";
-
-/// @brief Message last frame number to handle
 static const char last_frame_message[] = "Optional. Last frame number to handle in demo. If negative, handle all input video.";
-
-/// @brief Message teacher id
 static const char teacher_id_message[] = "Optional. ID of a teacher. You must also set a faces gallery parameter (-fg) to use it.";
-
-/// @brief Message min action duration
 static const char min_action_duration_message[] = "Optional. Minimum action duration in seconds.";
-
-/// @brief Message same action time delta
 static const char same_action_time_delta_message[] = "Optional. Maximum time difference between actions in seconds.";
-
-/// @brief Message student actions
 static const char student_actions_message[] = "Optional. List of student actions separated by a comma.";
-
-/// @brief Message student actions for top-k mode
 static const char top_actions_message[] = "Optional. List of student actions (for top-k mode) separated by a comma.";
-
-/// @brief Message teacher actions
 static const char teacher_actions_message[] = "Optional. List of teacher actions separated by a comma.";
-
-/// @brief Message for target action name for top-k mode
 static const char target_action_name_message[] = "Optional. Target action name.";
-
-/// @brief Message for number of target actions
-static const char target_actions_num_message[] = "Optional. Number of first K students. If this parameter is positive,"\
-"the demo detects first K persons with the action, pointed by the parameter 'top_id'";
-
-/// @brief Message crop gallery
+static const char target_actions_num_message[] = "Optional. Number of first K students. If this parameter is positive, "
+                                                 "the demo detects first K persons with the action, pointed by the parameter 'top_id'";
 static const char crop_gallery_message[] = "Optional. Crop images during faces gallery creation.";
-
-/// @brief Message for probability threshold argument for face detections during database registration.
 static const char face_threshold_registration_output_message[] = "Optional. Probability threshold for face detections during database registration.";
-
-/// @brief Message for minumum input size for faces database registration.
 static const char min_size_fr_reg_output_message[] = "Optional. Minimum input size for faces during database registration.";
-
-/// @brief Message action statistics output flag
 static const char act_det_output_message[] = "Optional. Output file name to save per-person action detections in.";
-
-/// @brief Message for number of frames for action tracker
 static const char tracker_smooth_size_message[] = "Optional. Number of frames to smooth actions.";
+static const char utilization_monitors_message[] = "Optional. List of monitors to show initially.";
 
-/// @brief Define flag for showing help message <br>
 DEFINE_bool(h, false, help_message);
-
-/// @brief Define parameter for set image file <br>
-/// It is a required parameter
 DEFINE_string(i, "cam", video_message);
-
-/// @brief Define parameter for person/action detection model file <br>
-/// It is a required parameter
 DEFINE_string(m_act, "", person_action_detection_model_message);
-
-/// @brief Define parameter for face detection model file <br>
-/// It is a required parameter
 DEFINE_string(m_fd, "", face_detection_model_message);
-
-/// @brief Define parameter for facial landmarks model file <br>
-/// It is a required parameter
 DEFINE_string(m_lm, "", facial_landmarks_model_message);
-
-/// @brief Define parameter for face reidentification model file <br>
-/// It is a required parameter
 DEFINE_string(m_reid, "", face_reid_model_message);
-
-/// @brief device the target device for person/action detection infer on <br>
 DEFINE_string(d_act, "CPU", target_device_message_action_detection);
-
-/// @brief device the target device for face detection on <br>
 DEFINE_string(d_fd, "CPU", target_device_message_face_detection);
-
-/// @brief device the target device for facial landnmarks regression infer on <br>
 DEFINE_string(d_lm, "CPU", target_device_message_landmarks_regression);
-
-/// @brief device the target device for face reidentification infer on <br>
 DEFINE_string(d_reid, "CPU", target_device_message_face_reid);
-
-/// @brief Enable per-layer performance report
+DEFINE_bool(greedy_reid_matching, false, greedy_reid_matching_message);
 DEFINE_bool(pc, false, performance_counter_message);
-
-/// @brief clDNN custom kernels path <br>
-/// Default is ./lib
 DEFINE_string(c, "", custom_cldnn_message);
-
-/// @brief Absolute path to CPU library with user layers <br>
-/// It is a optional parameter
 DEFINE_string(l, "", custom_cpu_library_message);
-
-/// @brief Output file name to save per-person action statistics in.
-/// It is an optional parameter
 DEFINE_string(ad, "", act_stat_output_message);
-
-/// @brief Flag to output raw pipeline results<br>
-/// It is an optional parameter
 DEFINE_bool(r, false, raw_output_message);
-
-/// @brief Define probability threshold for person/action detection <br>
-/// It is an optional parameter
 DEFINE_double(t_ad, 0.3, person_threshold_output_message);
-
-/// @brief Define probability threshold for action recognition <br>
-/// It is an optional parameter
 DEFINE_double(t_ar, 0.75, action_threshold_output_message);
-
-/// @brief Define probability threshold for face detections <br>
-/// It is an optional parameter
 DEFINE_double(t_fd, 0.6, face_threshold_output_message);
-
-/// @brief Define cosine distance threshold for face reid <br>
-/// It is an optional parameter
 DEFINE_double(t_reid, 0.7, threshold_output_message_face_reid);
-
-/// @brief Path to a faces gallery for reid <br>
-/// It is a optional parameter
 DEFINE_string(fg, "", reid_gallery_path_message);
-
-/// @brief File to write output video with visualization to.
-/// It is a optional parameter
 DEFINE_string(out_v, "", output_video_message);
-
-/// @brief Flag to disable processed video showing<br>
-/// It is an optional parameter
 DEFINE_bool(no_show, false, no_show_processed_video);
-
-/// @brief Input image height for face detector<br>
-/// It is an optional parameter
 DEFINE_int32(inh_fd, 600, input_image_height_output_message);
-
-/// @brief Input image width for face detector<br>
-/// It is an optional parameter
 DEFINE_int32(inw_fd, 600, input_image_width_output_message);
-
-/// @brief Expand ratio for bbox before face recognition<br>
-/// It is an optional parameter
 DEFINE_double(exp_r_fd, 1.15, face_threshold_output_message);
-
-/// @brief Input image height for face detector<br>
-/// It is an optional parameter
 DEFINE_int32(last_frame, -1, last_frame_message);
-
-/// @brief Label of teacher<br>
-/// It is an optional parameter
 DEFINE_string(teacher_id, "", teacher_id_message);
-
-/// @brief Min action duration<br>
-/// It is an optional parameter
 DEFINE_double(min_ad, 1.0, min_action_duration_message);
-
-/// @brief Same action time delta<br>
-/// It is an optional parameter
 DEFINE_double(d_ad, 1.0, same_action_time_delta_message);
-
-/// @brief Labels of student actions<br>
-/// It is an optional parameter
 DEFINE_string(student_ac, "sitting,standing,raising_hand", student_actions_message);
-
-/// @brief Labels of student actions for top-k mode<br>
-/// It is an optional parameter
 DEFINE_string(top_ac, "sitting,raising_hand", top_actions_message);
-
-/// @brief Labels of teacher actions<br>
-/// It is an optional parameter
 DEFINE_string(teacher_ac, "standing,writing,demonstrating", teacher_actions_message);
-
-/// @brief Define target action name for top-k mode <br>
-/// It is an optional parameter
 DEFINE_string(top_id, "raising_hand", target_action_name_message);
-
-/// @brief Define maximal number of target actions <br>
-/// It is an optional parameter
 DEFINE_int32(a_top, -1, target_actions_num_message);
-
-/// @brief Flag to enable image cropping during database creation<br>
-/// It is an optional parameter
 DEFINE_bool(crop_gallery, false, crop_gallery_message);
-
-/// @brief Define probability threshold for face detections during registration<br>
-/// It is an optional parameter
 DEFINE_double(t_reg_fd, 0.9, face_threshold_registration_output_message);
-
-/// @brief Minimum input image width & heigh for sucessful face registration<br>
-/// It is an optional parameter
 DEFINE_int32(min_size_fr, 128, min_size_fr_reg_output_message);
-
-/// @brief Output file name to save per-person action detections in.
-/// It is an optional parameter
 DEFINE_string(al, "", act_det_output_message);
-
-/// @brief Number of frames to smooth actions<br>
-/// It is an optional parameter
 DEFINE_int32(ss_t, -1, tracker_smooth_size_message);
+DEFINE_string(u, "", utilization_monitors_message);
 
 /**
 * @brief This function show a help message
@@ -307,6 +130,7 @@ static void showUsage() {
     std::cout << "    -d_lm '<device>'               " << target_device_message_landmarks_regression << std::endl;
     std::cout << "    -d_reid '<device>'             " << target_device_message_face_reid << std::endl;
     std::cout << "    -out_v  '<path>'               " << output_video_message << std::endl;
+    std::cout << "    -greedy_reid_matching          " << greedy_reid_matching_message << std::endl;
     std::cout << "    -pc                            " << performance_counter_message << std::endl;
     std::cout << "    -r                             " << raw_output_message << std::endl;
     std::cout << "    -ad                            " << act_stat_output_message << std::endl;
@@ -333,4 +157,5 @@ static void showUsage() {
     std::cout << "    -min_size_fr                   " << min_size_fr_reg_output_message << std::endl;
     std::cout << "    -al                            " << act_det_output_message << std::endl;
     std::cout << "    -ss_t                          " << tracker_smooth_size_message << std::endl;
+    std::cout << "    -u                             " << utilization_monitors_message << std::endl;
 }
diff --git a/demos/smart_classroom_demo/include/tracker.hpp b/demos/smart_classroom_demo/include/tracker.hpp
index b93344cca3d..62f4fb45f23 100644
--- a/demos/smart_classroom_demo/include/tracker.hpp
+++ b/demos/smart_classroom_demo/include/tracker.hpp
@@ -40,7 +40,10 @@ using TrackedObjects = std::vector<TrackedObject>;
 ///
 class KuhnMunkres {
 public:
-    KuhnMunkres();
+    ///
+    /// \brief Initializes the class for assignment problem solving.
+    /// \param[in] greedy If a faster greedy matching algorithm should be used.
+    explicit KuhnMunkres(bool greedy = false);
 
     ///
     /// \brief Solves the assignment problem for given dissimilarity matrix.
@@ -180,7 +183,6 @@ class Tracker {
     explicit Tracker(const TrackerParams &params = TrackerParams())
         : params_(params),
           tracks_counter_(0),
-          valid_tracks_counter_(0),
           frame_size_() {}
 
     ///
@@ -210,12 +212,6 @@ class Tracker {
     ///
     void Reset();
 
-    ///
-    /// \brief Returns number of counted tracks.
-    /// \return a number of counted tracks.
-    ///
-    size_t Count() const;
-
     ///
     /// \brief Returns recently detected objects.
     /// \return recently detected objects.
@@ -275,8 +271,6 @@ class Tracker {
     void DropForgottenTracks();
 
 private:
-    void DropForgottenTrack(size_t track_id);
-
     const std::set<size_t> &active_track_ids() const { return active_track_ids_; }
 
     float ShapeAffinity(const cv::Rect &trk, const cv::Rect &det);
@@ -332,9 +326,6 @@ class Tracker {
     // Number of all current tracks.
     size_t tracks_counter_;
 
-    // Number of dropped valid tracks.
-    size_t valid_tracks_counter_;
-
     cv::Size frame_size_;
 };
 
diff --git a/demos/smart_classroom_demo/main.cpp b/demos/smart_classroom_demo/main.cpp
index 1f2326d2ea1..95a08f5949c 100644
--- a/demos/smart_classroom_demo/main.cpp
+++ b/demos/smart_classroom_demo/main.cpp
@@ -5,11 +5,9 @@
 #include <chrono>  // NOLINT
 
 #include <gflags/gflags.h>
+#include <monitors/presenter.h>
 #include <samples/ocv_common.hpp>
 #include <samples/slog.hpp>
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
 #include <string>
 #include <memory>
 #include <limits>
@@ -169,7 +167,7 @@ class Visualizer {
         if (enabled_ && !writer_.isOpened()) {
             cv::putText(frame_,
                         std::to_string(static_cast<int>(fps)) + " fps",
-                        cv::Point(10, 50), cv::FONT_HERSHEY_SIMPLEX, 2,
+                        cv::Point(10, 50), cv::FONT_HERSHEY_SIMPLEX, 1,
                         color, 2, cv::LINE_AA);
         }
     }
@@ -206,7 +204,7 @@ class Visualizer {
             const int text_shift = (crop_width_ - label_size.width) / 2;
             cv::putText(top_persons_, label_to_draw,
                         cv::Point(shift + text_shift, label_size.height + baseLine / 2),
-                        cv::FONT_HERSHEY_SIMPLEX, 2, cv::Scalar(0, 255, 0), 2, cv::LINE_AA);
+                        cv::FONT_HERSHEY_SIMPLEX, 1, cv::Scalar(0, 255, 0), 2, cv::LINE_AA);
         }
 
         cv::imshow(top_window_name_, top_persons_);
@@ -351,10 +349,10 @@ std::string GetActionTextLabel(const unsigned label, const std::vector<std::stri
 }
 
 cv::Scalar GetActionTextColor(const unsigned label) {
-    static std::vector<cv::Scalar> actions_map = {
+    static const cv::Scalar label_colors[] = {
         cv::Scalar(0, 255, 0), cv::Scalar(255, 0, 0), cv::Scalar(0, 0, 255), cv::Scalar(0, 255, 255)};
-    if (label < actions_map.size()) {
-        return actions_map[label];
+    if (label < arraySize(label_colors)) {
+        return label_colors[label];
     }
     return cv::Scalar(0, 0, 0);
 }
@@ -424,13 +422,107 @@ bool checkDynamicBatchSupport(const Core& ie, const std::string& device)  {
         if (ie.GetConfig(device, CONFIG_KEY(DYN_BATCH_ENABLED)).as<std::string>() != PluginConfigParams::YES)
             return false;
     }
-    catch(const std::exception& error)  {
+    catch(const std::exception&)  {
         return false;
     }
     return true;
 }
 
-}  // namespace
+class FaceRecognizer {  // Abstract face-recognition interface; main() holds one via std::unique_ptr.
+public:
+    virtual ~FaceRecognizer() = default;
+
+    virtual bool LabelExists(const std::string &label) const = 0;  // true if `label` is a known identity label
+    virtual std::string GetLabelByID(int id) const = 0;  // text label for an identity id
+    virtual std::vector<std::string> GetIDToLabelMap() const = 0;  // presumably labels indexed by id -- TODO confirm
+
+    virtual std::vector<int> Recognize(const cv::Mat& frame, const detection::DetectedObjects& faces) = 0;  // main() indexes the result by face position
+
+    virtual void PrintPerformanceCounts(
+        const std::string &landmarks_device, const std::string &reid_device) = 0;
+};
+
+class FaceRecognizerNull : public FaceRecognizer {  // No-op recognizer: main() installs it when recognition models are not all given.
+public:
+    bool LabelExists(const std::string &) const override { return false; }  // no label is ever known
+
+    std::string GetLabelByID(int) const override {
+        return EmbeddingsGallery::unknown_label;
+    }
+
+    std::vector<std::string> GetIDToLabelMap() const override { return {}; }  // always an empty map
+
+    std::vector<int> Recognize(const cv::Mat&, const detection::DetectedObjects& faces) override {
+        return std::vector<int>(faces.size(), EmbeddingsGallery::unknown_id);  // one unknown id per detected face
+    }
+
+    void PrintPerformanceCounts(
+        const std::string &, const std::string &) override {}
+};
+
+class FaceRecognizerDefault : public FaceRecognizer {  // Recognizer built on landmark and re-id networks plus an embeddings gallery.
+public:
+    FaceRecognizerDefault(
+            const CnnConfig& landmarks_detector_config,
+            const CnnConfig& reid_config,
+            const detection::DetectorConfig& face_registration_det_config,
+            const std::string& face_gallery_path,
+            double reid_threshold,
+            int min_size_fr,
+            bool crop_gallery,
+            bool greedy_reid_matching
+    )
+        : landmarks_detector(landmarks_detector_config),
+          face_reid(reid_config),
+          face_gallery(face_gallery_path, reid_threshold, min_size_fr, crop_gallery,  // gallery is built from the two networks above
+                       face_registration_det_config, landmarks_detector, face_reid,
+                       greedy_reid_matching)
+    {
+        if (face_gallery.size() == 0) {  // an empty gallery is only reported, not treated as an error
+            slog::warn << "Face reid gallery is empty!" << slog::endl;
+        } else {
+            slog::info << "Face reid gallery size: " << face_gallery.size() << slog::endl;
+        }
+    }
+
+    bool LabelExists(const std::string &label) const override {  // forwarded to the gallery
+        return face_gallery.LabelExists(label);
+    }
+
+    std::string GetLabelByID(int id) const override {  // forwarded to the gallery
+        return face_gallery.GetLabelByID(id);
+    }
+
+    std::vector<std::string> GetIDToLabelMap() const override {  // forwarded to the gallery
+        return face_gallery.GetIDToLabelMap();
+    }
+
+    std::vector<int> Recognize(const cv::Mat& frame, const detection::DetectedObjects& faces) override {  // crop -> landmarks -> align -> embed -> gallery lookup
+        std::vector<cv::Mat> face_rois;
+
+        for (const auto& face : faces) {
+            face_rois.push_back(frame(face.rect));  // region of `frame` covered by the detection
+        }
+
+        std::vector<cv::Mat> landmarks, embeddings;
+
+        landmarks_detector.Compute(face_rois, &landmarks, cv::Size(2, 5));
+        AlignFaces(&face_rois, &landmarks);
+        face_reid.Compute(face_rois, &embeddings);
+        return face_gallery.GetIDsByEmbeddings(embeddings);
+    }
+
+    void PrintPerformanceCounts(
+            const std::string &landmarks_device, const std::string &reid_device) override {  // `override` keeps this tied to the base signature
+        landmarks_detector.PrintPerformanceCounts(landmarks_device);
+        face_reid.PrintPerformanceCounts(reid_device);
+    }
+
+private:
+    VectorCNN landmarks_detector;  // keep both networks declared before face_gallery: its initializer uses them
+    VectorCNN face_reid;
+    EmbeddingsGallery face_gallery;
+};
 
 bool ParseAndCheckCommandLine(int argc, char *argv[]) {
     // ---------------------------Parsing and validation of input args--------------------------------------
@@ -454,6 +546,7 @@ bool ParseAndCheckCommandLine(int argc, char *argv[]) {
     return true;
 }
 
+}  // namespace
 
 int main(int argc, char* argv[]) {
     try {
@@ -466,13 +559,9 @@ int main(int argc, char* argv[]) {
 
         const auto video_path = FLAGS_i;
         const auto ad_model_path = FLAGS_m_act;
-        const auto ad_weights_path = fileNameNoExt(FLAGS_m_act) + ".bin";
         const auto fd_model_path = FLAGS_m_fd;
-        const auto fd_weights_path = fileNameNoExt(FLAGS_m_fd) + ".bin";
         const auto fr_model_path = FLAGS_m_reid;
-        const auto fr_weights_path = fileNameNoExt(FLAGS_m_reid) + ".bin";
         const auto lm_model_path = FLAGS_m_lm;
-        const auto lm_weights_path = fileNameNoExt(FLAGS_m_lm) + ".bin";
         const auto teacher_id = FLAGS_teacher_id;
 
         if (!FLAGS_teacher_id.empty() && !FLAGS_top_id.empty()) {
@@ -522,10 +611,6 @@ int main(int argc, char* argv[]) {
 
             /** Load extensions for the CPU device **/
             if ((device.find("CPU") != std::string::npos)) {
-#ifdef WITH_EXTENSIONS
-                ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-#endif
-
                 if (!FLAGS_l.empty()) {
                     // CPU(MKLDNN) extensions are loaded as a shared library and passed as a pointer to base extension
                     auto extension_ptr = make_so_pointer<IExtension>(FLAGS_l);
@@ -549,79 +634,84 @@ int main(int argc, char* argv[]) {
             loadedDevices.insert(device);
         }
 
-        // Load action detector
-        ActionDetectorConfig action_config(ad_model_path, ad_weights_path);
-        action_config.deviceName = FLAGS_d_act;
-        action_config.ie = ie;
-        action_config.is_async = true;
-        action_config.enabled = !ad_model_path.empty();
-        action_config.detection_confidence_threshold = static_cast<float>(FLAGS_t_ad);
-        action_config.action_confidence_threshold = static_cast<float>(FLAGS_t_ar);
-        action_config.num_action_classes = actions_map.size();
-        ActionDetection action_detector(action_config);
-
-        // Load face detector
-        detection::DetectorConfig face_config(fd_model_path, fd_weights_path);
-        face_config.deviceName = FLAGS_d_fd;
-        face_config.ie = ie;
-        face_config.is_async = true;
-        face_config.enabled = !fd_model_path.empty();
-        face_config.confidence_threshold = static_cast<float>(FLAGS_t_fd);
-        face_config.input_h = FLAGS_inh_fd;
-        face_config.input_w = FLAGS_inw_fd;
-        face_config.increase_scale_x = static_cast<float>(FLAGS_exp_r_fd);
-        face_config.increase_scale_y = static_cast<float>(FLAGS_exp_r_fd);
-        detection::FaceDetection face_detector(face_config);
-
-        // Load face detector for face database registration
-        detection::DetectorConfig face_registration_det_config(fd_model_path, fd_weights_path);
-        face_registration_det_config.deviceName = FLAGS_d_fd;
-        face_registration_det_config.ie = ie;
-        face_registration_det_config.enabled = !fd_model_path.empty();
-        face_registration_det_config.is_async = false;
-        face_registration_det_config.confidence_threshold = static_cast<float>(FLAGS_t_reg_fd);
-        face_registration_det_config.increase_scale_x = static_cast<float>(FLAGS_exp_r_fd);
-        face_registration_det_config.increase_scale_y = static_cast<float>(FLAGS_exp_r_fd);
-        detection::FaceDetection face_detector_for_registration(face_registration_det_config);
-
-        // Load face reid
-        CnnConfig reid_config(fr_model_path, fr_weights_path);
-        reid_config.enabled = face_config.enabled && !fr_model_path.empty() && !lm_model_path.empty();
-        reid_config.deviceName = FLAGS_d_reid;
-        if (checkDynamicBatchSupport(ie, FLAGS_d_reid))
-            reid_config.max_batch_size = 16;
-        else
-            reid_config.max_batch_size = 1;
-        reid_config.ie = ie;
-        VectorCNN face_reid(reid_config);
-
-        // Load landmarks detector
-        CnnConfig landmarks_config(lm_model_path, lm_weights_path);
-        landmarks_config.max_batch_size = 16;
-        landmarks_config.enabled = face_config.enabled && reid_config.enabled && !lm_model_path.empty();
-        landmarks_config.deviceName = FLAGS_d_lm;
-        if (checkDynamicBatchSupport(ie, FLAGS_d_lm))
-            landmarks_config.max_batch_size = 16;
-        else
-            landmarks_config.max_batch_size = 1;
-        landmarks_config.ie = ie;
-        VectorCNN landmarks_detector(landmarks_config);
-
-        // Create face gallery
-        EmbeddingsGallery face_gallery(FLAGS_fg, FLAGS_t_reid, FLAGS_min_size_fr, FLAGS_crop_gallery,
-                                       face_detector_for_registration, landmarks_detector, face_reid);
-
-        if (!reid_config.enabled) {
-            slog::warn << "Face recognition models are disabled!"  << slog::endl;
-        } else if (!face_gallery.size()) {
-            slog::warn << "Face reid gallery is empty!"  << slog::endl;
+        std::unique_ptr<AsyncDetection<DetectedAction>> action_detector;
+        if (!ad_model_path.empty()) {
+            // Load action detector
+            ActionDetectorConfig action_config(ad_model_path);
+            action_config.deviceName = FLAGS_d_act;
+            action_config.ie = ie;
+            action_config.is_async = true;
+            action_config.detection_confidence_threshold = static_cast<float>(FLAGS_t_ad);
+            action_config.action_confidence_threshold = static_cast<float>(FLAGS_t_ar);
+            action_config.num_action_classes = actions_map.size();
+            action_detector.reset(new ActionDetection(action_config));
         } else {
-            slog::info << "Face reid gallery size: " << face_gallery.size() << slog::endl;
+            action_detector.reset(new NullDetection<DetectedAction>);
         }
 
-        if (actions_type == TEACHER && !face_gallery.LabelExists(teacher_id)) {
-            slog::err << "Teacher id does not exist in the gallery!"  << slog::endl;
-            return 1;
+        std::unique_ptr<AsyncDetection<detection::DetectedObject>> face_detector;
+        if (!fd_model_path.empty()) {
+            // Load face detector
+            detection::DetectorConfig face_config(fd_model_path);
+            face_config.deviceName = FLAGS_d_fd;
+            face_config.ie = ie;
+            face_config.is_async = true;
+            face_config.confidence_threshold = static_cast<float>(FLAGS_t_fd);
+            face_config.input_h = FLAGS_inh_fd;
+            face_config.input_w = FLAGS_inw_fd;
+            face_config.increase_scale_x = static_cast<float>(FLAGS_exp_r_fd);
+            face_config.increase_scale_y = static_cast<float>(FLAGS_exp_r_fd);
+            face_detector.reset(new detection::FaceDetection(face_config));
+        } else {
+            face_detector.reset(new NullDetection<detection::DetectedObject>);
+        }
+
+        std::unique_ptr<FaceRecognizer> face_recognizer;
+
+        if (!fd_model_path.empty() && !fr_model_path.empty() && !lm_model_path.empty()) {
+            // Create face recognizer
+
+            detection::DetectorConfig face_registration_det_config(fd_model_path);
+            face_registration_det_config.deviceName = FLAGS_d_fd;
+            face_registration_det_config.ie = ie;
+            face_registration_det_config.is_async = false;
+            face_registration_det_config.confidence_threshold = static_cast<float>(FLAGS_t_reg_fd);
+            face_registration_det_config.increase_scale_x = static_cast<float>(FLAGS_exp_r_fd);
+            face_registration_det_config.increase_scale_y = static_cast<float>(FLAGS_exp_r_fd);
+
+            CnnConfig reid_config(fr_model_path);
+            reid_config.deviceName = FLAGS_d_reid;
+            if (checkDynamicBatchSupport(ie, FLAGS_d_reid))
+                reid_config.max_batch_size = 16;
+            else
+                reid_config.max_batch_size = 1;
+            reid_config.ie = ie;
+
+            CnnConfig landmarks_config(lm_model_path);
+            landmarks_config.deviceName = FLAGS_d_lm;
+            if (checkDynamicBatchSupport(ie, FLAGS_d_lm))
+                landmarks_config.max_batch_size = 16;
+            else
+                landmarks_config.max_batch_size = 1;
+            landmarks_config.ie = ie;
+
+            face_recognizer.reset(new FaceRecognizerDefault(
+                landmarks_config, reid_config,
+                face_registration_det_config,
+                FLAGS_fg, FLAGS_t_reid, FLAGS_min_size_fr, FLAGS_crop_gallery, FLAGS_greedy_reid_matching));
+
+            if (actions_type == TEACHER && !face_recognizer->LabelExists(teacher_id)) {
+                slog::err << "Teacher id does not exist in the gallery!" << slog::endl;
+                return 1;
+            }
+        } else {
+            slog::warn << "Face recognition models are disabled!" << slog::endl;
+            if (actions_type == TEACHER) {
+                slog::err << "Face recognition must be enabled to recognize teacher actions." << slog::endl;
+                return 1;
+            }
+
+            face_recognizer.reset(new FaceRecognizerNull);
         }
 
         // Create tracker for reid
@@ -655,8 +745,6 @@ int main(int argc, char* argv[]) {
         Tracker tracker_action(tracker_action_params);
 
         cv::Mat frame, prev_frame;
-        DetectedActions actions;
-        detection::DetectedObjects faces;
 
         float work_time_ms = 0.f;
         float wait_time_ms = 0.f;
@@ -681,10 +769,10 @@ int main(int argc, char* argv[]) {
         }
 
         if (actions_type != TOP_K) {
-            action_detector.enqueue(frame);
-            action_detector.submitRequest();
-            face_detector.enqueue(frame);
-            face_detector.submitRequest();
+            action_detector->enqueue(frame);
+            action_detector->submitRequest();
+            face_detector->enqueue(frame);
+            face_detector->submitRequest();
         }
 
         prev_frame = frame.clone();
@@ -710,6 +798,9 @@ int main(int argc, char* argv[]) {
         }
         std::cout << std::endl;
 
+        cv::Size graphSize{static_cast<int>(frame.cols / 4), 60};
+        Presenter presenter(FLAGS_u, frame.rows - graphSize.height - 10, graphSize);
+
         while (!is_last_frame) {
             logger.CreateNextFrameRecord(cap.GetVideoPath(), work_num_frames, prev_frame.cols, prev_frame.rows);
             auto started = std::chrono::high_resolution_clock::now();
@@ -722,6 +813,9 @@ int main(int argc, char* argv[]) {
             if (key == ESC_KEY) {
                 break;
             }
+            presenter.handleKey(key);
+
+            presenter.drawGraphs(prev_frame);
 
             sc_visualizer.SetFrame(prev_frame);
 
@@ -729,8 +823,8 @@ int main(int argc, char* argv[]) {
                 if ( (is_monitoring_enabled && key == SPACE_KEY) ||
                      (!is_monitoring_enabled && key != SPACE_KEY) ) {
                     if (key == SPACE_KEY) {
-                        action_detector.wait();
-                        action_detector.fetchResults();
+                        action_detector->wait();
+                        action_detector->fetchResults();
 
                         tracker_action.Reset();
                         top_k_obj_ids.clear();
@@ -752,18 +846,17 @@ int main(int argc, char* argv[]) {
                     if (key == SPACE_KEY) {
                         is_monitoring_enabled = true;
 
-                        action_detector.enqueue(prev_frame);
-                        action_detector.submitRequest();
+                        action_detector->enqueue(prev_frame);
+                        action_detector->submitRequest();
                     }
 
-                    action_detector.wait();
-                    action_detector.fetchResults();
-                    actions = action_detector.results;
+                    action_detector->wait();
+                    DetectedActions actions = action_detector->fetchResults();
 
                     if (!is_last_frame) {
                         prev_frame_path = cap.GetVideoPath();
-                        action_detector.enqueue(frame);
-                        action_detector.submitRequest();
+                        action_detector->enqueue(frame);
+                        action_detector->submitRequest();
                     }
 
                     TrackedObjects tracked_action_objects;
@@ -811,36 +904,26 @@ int main(int argc, char* argv[]) {
                     }
                 }
             } else {
-                face_detector.wait();
-                face_detector.fetchResults();
-                faces = face_detector.results;
+                face_detector->wait();
+                detection::DetectedObjects faces = face_detector->fetchResults();
 
-                action_detector.wait();
-                action_detector.fetchResults();
-                actions = action_detector.results;
+                action_detector->wait();
+                DetectedActions actions = action_detector->fetchResults();
 
                 if (!is_last_frame) {
                     prev_frame_path = cap.GetVideoPath();
-                    face_detector.enqueue(frame);
-                    face_detector.submitRequest();
-                    action_detector.enqueue(frame);
-                    action_detector.submitRequest();
+                    face_detector->enqueue(frame);
+                    face_detector->submitRequest();
+                    action_detector->enqueue(frame);
+                    action_detector->submitRequest();
                 }
 
-                std::vector<cv::Mat> face_rois, landmarks, embeddings;
-                TrackedObjects tracked_face_objects;
+                auto ids = face_recognizer->Recognize(prev_frame, faces);
 
-                for (const auto& face : faces) {
-                    face_rois.push_back(prev_frame(face.rect));
-                }
-                landmarks_detector.Compute(face_rois, &landmarks, cv::Size(2, 5));
-                AlignFaces(&face_rois, &landmarks);
-                face_reid.Compute(face_rois, &embeddings);
-                auto ids = face_gallery.GetIDsByEmbeddings(embeddings);
+                TrackedObjects tracked_face_objects;
 
                 for (size_t i = 0; i < faces.size(); i++) {
-                    int label = ids.empty() ? EmbeddingsGallery::unknown_id : ids[i];
-                    tracked_face_objects.emplace_back(faces[i].rect, faces[i].confidence, label);
+                    tracked_face_objects.emplace_back(faces[i].rect, faces[i].confidence, ids[i]);
                 }
                 tracker_reid.Process(prev_frame, tracked_face_objects, work_num_frames);
 
@@ -863,9 +946,11 @@ int main(int argc, char* argv[]) {
                 std::map<int, int> frame_face_obj_id_to_action;
                 for (size_t j = 0; j < tracked_faces.size(); j++) {
                     const auto& face = tracked_faces[j];
+                    std::string face_label = face_recognizer->GetLabelByID(face.label);
+
                     std::string label_to_draw;
                     if (face.label != EmbeddingsGallery::unknown_id)
-                        label_to_draw += face_gallery.GetLabelByID(face.label);
+                        label_to_draw += face_label;
 
                     int person_ind = GetIndexOfTheNearestPerson(face, tracked_actions);
                     int action_ind = default_action_index;
@@ -879,11 +964,11 @@ int main(int argc, char* argv[]) {
                         }
                         frame_face_obj_id_to_action[face.object_id] = action_ind;
                         sc_visualizer.DrawObject(face.rect, label_to_draw, red_color, white_color, true);
-                        logger.AddFaceToFrame(face.rect, face_gallery.GetLabelByID(face.label), "");
+                        logger.AddFaceToFrame(face.rect, face_label, "");
                     }
 
                     if ((actions_type == TEACHER) && (person_ind >= 0)) {
-                        if (face_gallery.GetLabelByID(face.label) == teacher_id) {
+                        if (face_label == teacher_id) {
                             teacher_track_id = tracked_actions[person_ind].object_id;
                         } else if (teacher_track_id == tracked_actions[person_ind].object_id) {
                             teacher_track_id = -1;
@@ -895,7 +980,7 @@ int main(int argc, char* argv[]) {
                     for (const auto& action : tracked_actions) {
                         const auto& action_label = GetActionTextLabel(action.label, actions_map);
                         const auto& action_color = GetActionTextColor(action.label);
-                        const auto& text_label = face_config.enabled ? "" : action_label;
+                        const auto& text_label = fd_model_path.empty() ? action_label : "";
                         sc_visualizer.DrawObject(action.rect, text_label, action_color, white_color, true);
                         logger.AddPersonToFrame(action.rect, action_label, "");
                         logger.AddDetectionToFrame(action, work_num_frames);
@@ -938,12 +1023,13 @@ int main(int argc, char* argv[]) {
         slog::info << "Frames processed: " << total_num_frames << slog::endl;
         if (FLAGS_pc) {
             std::map<std::string, std::string>  mapDevices = getMapFullDevicesNames(ie, devices);
-            face_detector.wait();
-            action_detector.wait();
-            action_detector.PrintPerformanceCounts(getFullDeviceName(mapDevices, FLAGS_d_act));
-            face_detector.PrintPerformanceCounts(getFullDeviceName(mapDevices, FLAGS_d_fd));
-            face_reid.PrintPerformanceCounts(getFullDeviceName(mapDevices, FLAGS_d_reid));
-            landmarks_detector.PrintPerformanceCounts(getFullDeviceName(mapDevices, FLAGS_d_lm));
+            face_detector->wait();
+            action_detector->wait();
+            action_detector->printPerformanceCounts(getFullDeviceName(mapDevices, FLAGS_d_act));
+            face_detector->printPerformanceCounts(getFullDeviceName(mapDevices, FLAGS_d_fd));
+            face_recognizer->PrintPerformanceCounts(
+                getFullDeviceName(mapDevices, FLAGS_d_lm),
+                getFullDeviceName(mapDevices, FLAGS_d_reid));
         }
 
         if (actions_type == STUDENT) {
@@ -953,7 +1039,9 @@ int main(int argc, char* argv[]) {
             std::vector<Track> new_face_tracks = UpdateTrackLabelsToBestAndFilterOutUnknowns(face_tracks);
             std::map<int, int> face_track_id_to_label = GetMapFaceTrackIdToLabel(new_face_tracks);
 
-            if (reid_config.enabled && face_gallery.size() > 0) {
+            std::vector<std::string> face_id_to_label_map = face_recognizer->GetIDToLabelMap();
+
+            if (!face_id_to_label_map.empty()) {
                 std::map<int, FrameEventsTrack> face_obj_id_to_actions_track;
                 ConvertActionMapsToFrameEventTracks(face_obj_id_to_action_maps, default_action_index,
                                                     &face_obj_id_to_actions_track);
@@ -968,7 +1056,7 @@ int main(int argc, char* argv[]) {
                 slog::info << "Final ID->events mapping" << slog::endl;
                 logger.DumpTracks(face_obj_id_to_events,
                                   actions_map, face_track_id_to_label,
-                                  face_gallery.GetIDToLabelMap());
+                                  face_id_to_label_map);
 
                 std::vector<std::map<int, int>> face_obj_id_to_smoothed_action_maps;
                 ConvertRangeEventsTracksToActionMaps(end_frame, face_obj_id_to_events,
@@ -978,10 +1066,12 @@ int main(int argc, char* argv[]) {
                 logger.DumpDetections(cap.GetVideoPath(), frame.size(), work_num_frames,
                                       new_face_tracks,
                                       face_track_id_to_label,
-                                      actions_map, face_gallery.GetIDToLabelMap(),
+                                      actions_map, face_id_to_label_map,
                                       face_obj_id_to_smoothed_action_maps);
             }
         }
+
+        std::cout << presenter.reportMeans() << '\n';
     }
     catch (const std::exception& error) {
         slog::err << error.what() << slog::endl;
diff --git a/demos/smart_classroom_demo/src/action_detector.cpp b/demos/smart_classroom_demo/src/action_detector.cpp
index b7e2c413749..356e8e5088a 100644
--- a/demos/smart_classroom_demo/src/action_detector.cpp
+++ b/demos/smart_classroom_demo/src/action_detector.cpp
@@ -27,14 +27,10 @@ bool SortScorePairDescend(const std::pair<float, T>& pair1,
 void ActionDetection::submitRequest() {
     if (!enqueued_frames_) return;
     enqueued_frames_ = 0;
-    results_fetched_ = false;
-    results.clear();
     BaseCnnDetection::submitRequest();
 }
 
 void ActionDetection::enqueue(const cv::Mat &frame) {
-    if (!enabled()) return;
-
     if (!request) {
         request = net_.CreateInferRequestPtr();
     }
@@ -50,80 +46,77 @@ void ActionDetection::enqueue(const cv::Mat &frame) {
 }
 
 ActionDetection::ActionDetection(const ActionDetectorConfig& config)
-    : BaseCnnDetection(config.enabled, config.is_async), config_(config) {
-    if (config.enabled) {
-        topoName = "action detector";
-        CNNNetReader net_reader;
-        net_reader.ReadNetwork(config.path_to_model);
-        net_reader.ReadWeights(config.path_to_weights);
-        if (!net_reader.isParseSuccess()) {
-            THROW_IE_EXCEPTION << "Cannot load model";
-        }
-
-        net_reader.getNetwork().setBatchSize(config.max_batch_size);
-
-        InputsDataMap inputInfo(net_reader.getNetwork().getInputsInfo());
-        if (inputInfo.size() != 1) {
-            THROW_IE_EXCEPTION << "Action Detection network should have only one input";
-        }
-        InputInfo::Ptr inputInfoFirst = inputInfo.begin()->second;
-        inputInfoFirst->setPrecision(Precision::U8);
-        inputInfoFirst->getInputData()->setLayout(Layout::NCHW);
-
-        network_input_size_.height = inputInfoFirst->getTensorDesc().getDims()[2];
-        network_input_size_.width = inputInfoFirst->getTensorDesc().getDims()[3];
-
-        OutputsDataMap outputInfo(net_reader.getNetwork().getOutputsInfo());
-
-        for (auto&& item : outputInfo) {
-            item.second->setPrecision(Precision::FP32);
-            item.second->setLayout(InferenceEngine::TensorDesc::getLayoutByDims(item.second->getDims()));
-        }
-
-        new_network_ = outputInfo.find(config_.new_loc_blob_name) != outputInfo.end();
-        input_name_ = inputInfo.begin()->first;
-        net_ = config_.ie.LoadNetwork(net_reader.getNetwork(), config_.deviceName);
+        : BaseCnnDetection(config.is_async), config_(config) {  // reads the model, sets I/O precision, loads it, then indexes the anchor outputs
+    topoName = "action detector";
+    auto network = config.ie.ReadNetwork(config.path_to_model);  // only the model path is passed to ReadNetwork
 
-        const auto& head_anchors = new_network_ ? config_.new_anchors : config_.old_anchors;
-        const int num_heads = head_anchors.size();
+    network.setBatchSize(config.max_batch_size);
 
-        head_ranges_.resize(num_heads + 1);
-        glob_anchor_map_.resize(num_heads);
-        head_step_sizes_.resize(num_heads);
-
-        num_glob_anchors_ = 0;
-        head_ranges_[0] = 0;
-        int head_shift = 0;
-        for (int head_id = 0; head_id < num_heads; ++head_id) {
-            glob_anchor_map_[head_id].resize(head_anchors[head_id]);
+    InputsDataMap inputInfo(network.getInputsInfo());
+    if (inputInfo.size() != 1) {
+        THROW_IE_EXCEPTION << "Action Detection network should have only one input";
+    }
+    InputInfo::Ptr inputInfoFirst = inputInfo.begin()->second;
+    inputInfoFirst->setPrecision(Precision::U8);
+    inputInfoFirst->getInputData()->setLayout(Layout::NCHW);
 
-            int anchor_height, anchor_width;
-            for (int anchor_id = 0; anchor_id < head_anchors[head_id]; ++anchor_id) {
-                const auto glob_anchor_name = new_network_
-                      ? config_.new_action_conf_blob_name_prefix + std::to_string(head_id + 1) +
-                        config_.new_action_conf_blob_name_suffix + std::to_string(anchor_id + 1)
-                      : config_.old_action_conf_blob_name_prefix + std::to_string(anchor_id + 1);
-                glob_anchor_names_.push_back(glob_anchor_name);
+    network_input_size_.height = inputInfoFirst->getTensorDesc().getDims()[2];
+    network_input_size_.width = inputInfoFirst->getTensorDesc().getDims()[3];
 
-                const auto anchor_dims = outputInfo[glob_anchor_name]->getDims();
-                anchor_height = new_network_ ? anchor_dims[2] : anchor_dims[1];
-                anchor_width = new_network_ ? anchor_dims[3] : anchor_dims[2];
+    OutputsDataMap outputInfo(network.getOutputsInfo());
 
-                const int anchor_size = anchor_height * anchor_width;
-                head_shift += anchor_size;
+    for (auto&& item : outputInfo) {
+        item.second->setPrecision(Precision::FP32);
+    }
 
-                head_step_sizes_[head_id] = new_network_ ? anchor_size : 1;
-                glob_anchor_map_[head_id][anchor_id] = num_glob_anchors_++;
+    new_network_ = outputInfo.find(config_.new_loc_blob_name) != outputInfo.end();  // presence of the new-style location blob selects the new layout
+    input_name_ = inputInfo.begin()->first;
+    net_ = config_.ie.LoadNetwork(network, config_.deviceName);
+
+    const auto& head_anchors = new_network_ ? config_.new_anchors : config_.old_anchors;
+    const int num_heads = head_anchors.size();
+
+    head_ranges_.resize(num_heads + 1);
+    glob_anchor_map_.resize(num_heads);
+    head_step_sizes_.resize(num_heads);
+
+    num_glob_anchors_ = 0;
+    head_ranges_[0] = 0;
+    int head_shift = 0;  // running total of anchor cells over all heads processed so far
+    for (int head_id = 0; head_id < num_heads; ++head_id) {
+        glob_anchor_map_[head_id].resize(head_anchors[head_id]);
+
+        int anchor_height = 0, anchor_width = 0;  // initialized: both are read after the loop even if the head has no anchors
+        for (int anchor_id = 0; anchor_id < head_anchors[head_id]; ++anchor_id) {
+            const auto glob_anchor_name = new_network_
+                  ? config_.new_action_conf_blob_name_prefix + std::to_string(head_id + 1) +
+                    config_.new_action_conf_blob_name_suffix + std::to_string(anchor_id + 1)
+                  : config_.old_action_conf_blob_name_prefix + std::to_string(anchor_id + 1);
+            glob_anchor_names_.push_back(glob_anchor_name);
+
+            const auto anchor_dims = outputInfo.at(glob_anchor_name)->getDims();  // at() throws on a missing blob; operator[] would insert and dereference a null pointer
+            anchor_height = new_network_ ? anchor_dims[2] : anchor_dims[1];
+            anchor_width = new_network_ ? anchor_dims[3] : anchor_dims[2];
+            std::size_t action_dimension_idx = new_network_ ? 1 : 3;
+            if (anchor_dims[action_dimension_idx] != config_.num_action_classes) {
+                throw std::logic_error("The number of specified actions and the number of actions predicted by "
+                    "the Person/Action Detection Retail model must match");
             }
 
-            head_ranges_[head_id + 1] = head_shift;
-            head_blob_sizes_.emplace_back(anchor_width, anchor_height);
-        }
+            const int anchor_size = anchor_height * anchor_width;
+            head_shift += anchor_size;
 
-        num_candidates_ = head_shift;
+            head_step_sizes_[head_id] = new_network_ ? anchor_size : 1;
+            glob_anchor_map_[head_id][anchor_id] = num_glob_anchors_++;
+        }
 
-        binary_task_ = config_.num_action_classes == 2;
+        head_ranges_[head_id + 1] = head_shift;
+        head_blob_sizes_.emplace_back(anchor_width, anchor_height);
     }
+
+    num_candidates_ = head_shift;
+
+    binary_task_ = config_.num_action_classes == 2;
 }
 
 std::vector<int> ieSizeToVector(const SizeVector& ie_output_dims) {
@@ -134,13 +127,7 @@ std::vector<int> ieSizeToVector(const SizeVector& ie_output_dims) {
     return blob_sizes;
 }
 
-void ActionDetection::fetchResults() {
-    if (!enabled()) return;
-    results.clear();
-    if (results_fetched_) return;
-    results_fetched_ = true;
-
-
+DetectedActions ActionDetection::fetchResults() {
     const auto loc_blob_name = new_network_ ? config_.new_loc_blob_name : config_.old_loc_blob_name;
     const auto det_conf_blob_name = new_network_ ? config_.new_det_conf_blob_name : config_.old_det_conf_blob_name;
 
@@ -164,8 +151,8 @@ void ActionDetection::fetchResults() {
     }
 
     /** Parse detections **/
-    GetDetections(loc_out, main_conf_out, priorbox_out, add_conf_out,
-                  cv::Size(static_cast<int>(width_), static_cast<int>(height_)), &results);
+    return GetDetections(loc_out, main_conf_out, priorbox_out, add_conf_out,
+                         cv::Size(static_cast<int>(width_), static_cast<int>(height_)));
 }
 
 inline ActionDetection::NormalizedBBox
@@ -228,9 +215,9 @@ cv::Rect ActionDetection::ConvertToRect(
                     static_cast<int>((decoded_bbox_ymax - decoded_bbox_ymin) * frame_size.height));
 }
 
-void ActionDetection::GetDetections(const cv::Mat& loc, const cv::Mat& main_conf,
+DetectedActions ActionDetection::GetDetections(const cv::Mat& loc, const cv::Mat& main_conf,
         const cv::Mat& priorboxes, const std::vector<cv::Mat>& add_conf,
-        const cv::Size& frame_size, DetectedActions* detections) const {
+        const cv::Size& frame_size) const {
     /** Prepare input data buffers **/
     const float* loc_data = reinterpret_cast<float*>(loc.data);
     const float* det_conf_data = reinterpret_cast<float*>(main_conf.data);
@@ -279,7 +266,7 @@ void ActionDetection::GetDetections(const cv::Mat& loc, const cv::Mat& main_conf
         int action_label = -1;
         float action_max_exp_value = 0.f;
         float action_sum_exp_values = 0.f;
-        for (int c = 0; c < config_.num_action_classes; ++c) {
+        for (size_t c = 0; c < config_.num_action_classes; ++c) {
             float action_exp_value =
                 std::exp(scale * anchor_conf_data[action_conf_idx_shift + c * action_conf_step]);
             action_sum_exp_values += action_exp_value;
@@ -328,10 +315,11 @@ void ActionDetection::GetDetections(const cv::Mat& loc, const cv::Mat& main_conf
                           config_.detection_confidence_threshold,
                           &out_det_indices);
 
-    detections->clear();
+    DetectedActions detections;
     for (size_t i = 0; i < out_det_indices.size(); ++i) {
-        detections->emplace_back(valid_detections[out_det_indices[i]]);
+        detections.emplace_back(valid_detections[out_det_indices[i]]);
     }
+    return detections;
 }
 
 void ActionDetection::SoftNonMaxSuppression(const DetectedActions& detections,
diff --git a/demos/smart_classroom_demo/src/cnn.cpp b/demos/smart_classroom_demo/src/cnn.cpp
index f8c6690f339..cbecebd76d9 100644
--- a/demos/smart_classroom_demo/src/cnn.cpp
+++ b/demos/smart_classroom_demo/src/cnn.cpp
@@ -17,24 +17,15 @@ using namespace InferenceEngine;
 
 CnnDLSDKBase::CnnDLSDKBase(const Config& config) : config_(config) {}
 
-bool CnnDLSDKBase::Enabled() const {
-    return config_.enabled;
-}
-
 void CnnDLSDKBase::Load() {
-    CNNNetReader net_reader;
-    net_reader.ReadNetwork(config_.path_to_model);
-    net_reader.ReadWeights(config_.path_to_weights);
+    auto cnnNetwork = config_.ie.ReadNetwork(config_.path_to_model);
 
-    if (!net_reader.isParseSuccess()) {
-        THROW_IE_EXCEPTION << "Cannot load model";
-    }
 
-    const int currentBatchSize = net_reader.getNetwork().getBatchSize();
+    const int currentBatchSize = cnnNetwork.getBatchSize();
     if (currentBatchSize != config_.max_batch_size)
-        net_reader.getNetwork().setBatchSize(config_.max_batch_size);
+        cnnNetwork.setBatchSize(config_.max_batch_size);
 
-    InferenceEngine::InputsDataMap in = net_reader.getNetwork().getInputsInfo();
+    InferenceEngine::InputsDataMap in = cnnNetwork.getInputsInfo();
     if (in.size() != 1) {
         THROW_IE_EXCEPTION << "Network should have only one input";
     }
@@ -42,22 +33,19 @@ void CnnDLSDKBase::Load() {
     in.begin()->second->setLayout(Layout::NCHW);
     input_blob_name_ = in.begin()->first;
 
-    OutputsDataMap out = net_reader.getNetwork().getOutputsInfo();
+    OutputsDataMap out = cnnNetwork.getOutputsInfo();
     for (auto&& item : out) {
         item.second->setPrecision(Precision::FP32);
         output_blobs_names_.push_back(item.first);
     }
 
-    executable_network_ = config_.ie.LoadNetwork(net_reader.getNetwork(), config_.deviceName);
+    executable_network_ = config_.ie.LoadNetwork(cnnNetwork, config_.deviceName);
     infer_request_ = executable_network_.CreateInferRequest();
 }
 
 void CnnDLSDKBase::InferBatch(
         const std::vector<cv::Mat>& frames,
-        std::function<void(const InferenceEngine::BlobMap&, size_t)> fetch_results) const {
-    if (!config_.enabled) {
-        return;
-    }
+        const std::function<void(const InferenceEngine::BlobMap&, size_t)>& fetch_results) const {
     Blob::Ptr input = infer_request_.GetBlob(input_blob_name_);
     const size_t batch_size = input->getTensorDesc().getDims()[0];
 
@@ -81,25 +69,20 @@ void CnnDLSDKBase::InferBatch(
 }
 
 void CnnDLSDKBase::PrintPerformanceCounts(std::string fullDeviceName) const {
-    if (!config_.enabled) {
-        return;
-    }
     std::cout << "Performance counts for " << config_.path_to_model << std::endl << std::endl;
     ::printPerformanceCounts(infer_request_, std::cout, fullDeviceName, false);
 }
 
 void CnnDLSDKBase::Infer(const cv::Mat& frame,
-                         std::function<void(const InferenceEngine::BlobMap&, size_t)> fetch_results) const {
+                         const std::function<void(const InferenceEngine::BlobMap&, size_t)>& fetch_results) const {
     InferBatch({frame}, fetch_results);
 }
 
 VectorCNN::VectorCNN(const Config& config)
-    : CnnDLSDKBase(config) {
-    if (config.enabled) {
-        Load();
-        if (output_blobs_names_.size() != 1) {
-            THROW_IE_EXCEPTION << "Demo supports topologies only with 1 output";
-        }
+        : CnnDLSDKBase(config) {
+    Load();
+    if (output_blobs_names_.size() != 1) {
+        THROW_IE_EXCEPTION << "Demo supports topologies only with 1 output";
     }
 }
 
diff --git a/demos/smart_classroom_demo/src/detector.cpp b/demos/smart_classroom_demo/src/detector.cpp
index cfc01756bb2..048539f666d 100644
--- a/demos/smart_classroom_demo/src/detector.cpp
+++ b/demos/smart_classroom_demo/src/detector.cpp
@@ -50,14 +50,10 @@ cv::Rect IncreaseRect(const cv::Rect& r, float coeff_x,
 void FaceDetection::submitRequest() {
     if (!enqueued_frames_) return;
     enqueued_frames_ = 0;
-    results_fetched_ = false;
-    results.clear();
     BaseCnnDetection::submitRequest();
 }
 
 void FaceDetection::enqueue(const cv::Mat &frame) {
-    if (!enabled()) return;
-
     if (!request) {
         request = net_.CreateInferRequestPtr();
     }
@@ -73,72 +69,62 @@ void FaceDetection::enqueue(const cv::Mat &frame) {
 }
 
 FaceDetection::FaceDetection(const DetectorConfig& config) :
-    BaseCnnDetection(config.enabled, config.is_async), config_(config) {
-    if (config.enabled) {
-        topoName = "face detector";
-        CNNNetReader net_reader;
-        net_reader.ReadNetwork(config.path_to_model);
-        net_reader.ReadWeights(config.path_to_weights);
-        if (!net_reader.isParseSuccess()) {
-            THROW_IE_EXCEPTION << "Cannot load model";
-        }
-
-        InputsDataMap inputInfo(net_reader.getNetwork().getInputsInfo());
-        if (inputInfo.size() != 1) {
-            THROW_IE_EXCEPTION << "Face Detection network should have only one input";
-        }
-        InputInfo::Ptr inputInfoFirst = inputInfo.begin()->second;
-        inputInfoFirst->setPrecision(Precision::U8);
-        inputInfoFirst->getInputData()->setLayout(Layout::NCHW);
-
-        SizeVector input_dims = inputInfoFirst->getInputData()->getTensorDesc().getDims();
-        input_dims[2] = config_.input_h;
-        input_dims[3] = config_.input_w;
-        std::map<std::string, SizeVector> input_shapes;
-        input_shapes[inputInfo.begin()->first] = input_dims;
-        net_reader.getNetwork().reshape(input_shapes);
-
-        OutputsDataMap outputInfo(net_reader.getNetwork().getOutputsInfo());
-        if (outputInfo.size() != 1) {
-            THROW_IE_EXCEPTION << "Face Detection network should have only one output";
-        }
-        DataPtr& _output = outputInfo.begin()->second;
-        output_name_ = outputInfo.begin()->first;
+        BaseCnnDetection(config.is_async), config_(config) {
+    topoName = "face detector";
+    auto cnnNetwork = config.ie.ReadNetwork(config.path_to_model);
 
-        const CNNLayerPtr outputLayer = net_reader.getNetwork().getLayerByName(output_name_.c_str());
-        if (outputLayer->type != "DetectionOutput") {
-            THROW_IE_EXCEPTION << "Face Detection network output layer(" + outputLayer->name +
-                                  ") should be DetectionOutput, but was " +  outputLayer->type;
-        }
+    InputsDataMap inputInfo(cnnNetwork.getInputsInfo());
+    if (inputInfo.size() != 1) {
+        THROW_IE_EXCEPTION << "Face Detection network should have only one input";
+    }
+    InputInfo::Ptr inputInfoFirst = inputInfo.begin()->second;
+    inputInfoFirst->setPrecision(Precision::U8);
+    inputInfoFirst->getInputData()->setLayout(Layout::NCHW);
+
+    SizeVector input_dims = inputInfoFirst->getInputData()->getTensorDesc().getDims();
+    input_dims[2] = config_.input_h;
+    input_dims[3] = config_.input_w;
+    std::map<std::string, SizeVector> input_shapes;
+    input_shapes[inputInfo.begin()->first] = input_dims;
+    cnnNetwork.reshape(input_shapes);
+
+    OutputsDataMap outputInfo(cnnNetwork.getOutputsInfo());
+    if (outputInfo.size() != 1) {
+        THROW_IE_EXCEPTION << "Face Detection network should have only one output";
+    }
+    DataPtr& _output = outputInfo.begin()->second;
+    output_name_ = outputInfo.begin()->first;
 
-        if (outputLayer->params.find("num_classes") == outputLayer->params.end()) {
-            THROW_IE_EXCEPTION << "Face Detection network output layer (" +
-                                  output_name_ + ") should have num_classes integer attribute";
-        }
+    const CNNLayerPtr outputLayer = cnnNetwork.getLayerByName(output_name_.c_str());
+    if (outputLayer->type != "DetectionOutput") {
+        THROW_IE_EXCEPTION << "Face Detection network output layer(" + outputLayer->name +
+                              ") should be DetectionOutput, but was " +  outputLayer->type;
+    }
 
-        const SizeVector outputDims = _output->getTensorDesc().getDims();
-        max_detections_count_ = outputDims[2];
-        object_size_ = outputDims[3];
-        if (object_size_ != 7) {
-            THROW_IE_EXCEPTION << "Face Detection network output layer should have 7 as a last dimension";
-        }
-        if (outputDims.size() != 4) {
-            THROW_IE_EXCEPTION << "Face Detection network output dimensions not compatible shoulld be 4, but was " +
-                                  std::to_string(outputDims.size());
-        }
-        _output->setPrecision(Precision::FP32);
-        _output->setLayout(TensorDesc::getLayoutByDims(_output->getDims()));
+    if (outputLayer->params.find("num_classes") == outputLayer->params.end()) {
+        THROW_IE_EXCEPTION << "Face Detection network output layer (" +
+                              output_name_ + ") should have num_classes integer attribute";
+    }
 
-        input_name_ = inputInfo.begin()->first;
-        net_ = config_.ie.LoadNetwork(net_reader.getNetwork(), config_.deviceName);
+    const SizeVector outputDims = _output->getTensorDesc().getDims();
+    max_detections_count_ = outputDims[2];
+    object_size_ = outputDims[3];
+    if (object_size_ != 7) {
+        THROW_IE_EXCEPTION << "Face Detection network output layer should have 7 as a last dimension";
+    }
+    if (outputDims.size() != 4) {
+        THROW_IE_EXCEPTION << "Face Detection network output dimensions not compatible shoulld be 4, but was " +
+                              std::to_string(outputDims.size());
     }
+    _output->setPrecision(Precision::FP32);
+    _output->setLayout(TensorDesc::getLayoutByDims(_output->getDims()));
+
+    input_name_ = inputInfo.begin()->first;
+    net_ = config_.ie.LoadNetwork(cnnNetwork, config_.deviceName);
 }
 
-void FaceDetection::fetchResults() {
-    if (!enabled()) return;
-    results.clear();
-    if (results_fetched_) return;
-    results_fetched_ = true;
+DetectedObjects FaceDetection::fetchResults() {
+    DetectedObjects results;
     const float *data = request->GetBlob(output_name_)->buffer().as<float *>();
 
     for (int det_id = 0; det_id < max_detections_count_; ++det_id) {
@@ -176,4 +162,6 @@ void FaceDetection::fetchResults() {
             results.emplace_back(object);
         }
     }
+
+    return results;
 }
diff --git a/demos/smart_classroom_demo/src/image_grabber.cpp b/demos/smart_classroom_demo/src/image_grabber.cpp
index 56448f2adba..a5d39a17f2d 100644
--- a/demos/smart_classroom_demo/src/image_grabber.cpp
+++ b/demos/smart_classroom_demo/src/image_grabber.cpp
@@ -14,7 +14,6 @@ ImageGrabber::ImageGrabber(const std::string& fname) {
     } else {
         is_opened = cap.open(fname);
     }
-    cap_frame_index = -1;
     current_video_idx = 0;
     videos.push_back(fname);
     current_frame_idx = 0;
@@ -30,12 +29,7 @@ int ImageGrabber::GetFPS() const {
 
 bool ImageGrabber::IsOpened() const { return is_opened; }
 
-int ImageGrabber::GetFrameIndex() const { return cap_frame_index; }
-
-bool ImageGrabber::NextVideo() { return true; }
-
 bool ImageGrabber::GrabNext() {
-    cap_frame_index++;
     return cap.grab();
 }
 
diff --git a/demos/smart_classroom_demo/src/reid_gallery.cpp b/demos/smart_classroom_demo/src/reid_gallery.cpp
index 8743d0640e5..b4372b7c415 100644
--- a/demos/smart_classroom_demo/src/reid_gallery.cpp
+++ b/demos/smart_classroom_demo/src/reid_gallery.cpp
@@ -60,8 +60,7 @@ RegistrationStatus EmbeddingsGallery::RegisterIdentity(const std::string& identi
       detector.enqueue(image);
       detector.submitRequest();
       detector.wait();
-      detector.fetchResults();
-      detection::DetectedObjects faces = detector.results;
+      detection::DetectedObjects faces = detector.fetchResults();
       if (faces.size() == 0) {
         return RegistrationStatus::FAILURE_NOT_DETECTED;
       }
@@ -82,26 +81,30 @@ RegistrationStatus EmbeddingsGallery::RegisterIdentity(const std::string& identi
 
 EmbeddingsGallery::EmbeddingsGallery(const std::string& ids_list,
                                      double threshold, int min_size_fr,
-                                     bool crop_gallery, detection::FaceDetection& detector,
+                                     bool crop_gallery, const detection::DetectorConfig &detector_config,
                                      const VectorCNN& landmarks_det,
-                                     const VectorCNN& image_reid)
-    : reid_threshold(threshold) {
+                                     const VectorCNN& image_reid,
+                                     bool use_greedy_matcher)
+    : reid_threshold(threshold),
+      use_greedy_matcher(use_greedy_matcher) {
     if (ids_list.empty()) {
         return;
     }
 
-    if (!landmarks_det.Enabled() || !image_reid.Enabled()) {
-        return;
-    }
+    detection::FaceDetection detector(detector_config);
 
     cv::FileStorage fs(ids_list, cv::FileStorage::Mode::READ);
     cv::FileNode fn = fs.root();
-    int total_images = 0;
     int id = 0;
     for (cv::FileNodeIterator fit = fn.begin(); fit != fn.end(); ++fit) {
         cv::FileNode item = *fit;
         std::string label = item.name();
         std::vector<cv::Mat> embeddings;
+
+        // Please note that the case where there is more than one image in the gallery
+        // for a person might not work properly with the current implementation
+        // of the demo.
+        // Remove this assert at your own risk.
         CV_Assert(item.size() == 1);
 
         for (size_t i = 0; i < item.size(); i++) {
@@ -119,7 +122,6 @@ EmbeddingsGallery::EmbeddingsGallery(const std::string& ids_list,
             if (status == RegistrationStatus::SUCCESS) {
                 embeddings.push_back(emb);
                 idx_to_id.push_back(id);
-                total_images++;
                 identities.emplace_back(embeddings, label, id);
                 ++id;
             }
@@ -129,7 +131,7 @@ EmbeddingsGallery::EmbeddingsGallery(const std::string& ids_list,
 
 std::vector<int> EmbeddingsGallery::GetIDsByEmbeddings(const std::vector<cv::Mat>& embeddings) const {
     if (embeddings.empty() || idx_to_id.empty())
-        return std::vector<int>();
+        return std::vector<int>(embeddings.size(), unknown_id);
 
     cv::Mat distances(static_cast<int>(embeddings.size()), static_cast<int>(idx_to_id.size()), CV_32F);
 
@@ -142,7 +144,7 @@ std::vector<int> EmbeddingsGallery::GetIDsByEmbeddings(const std::vector<cv::Mat
             }
         }
     }
-    KuhnMunkres matcher;
+    KuhnMunkres matcher(use_greedy_matcher);
     auto matched_idx = matcher.Solve(distances);
     std::vector<int> output_ids;
     for (auto col_idx : matched_idx) {
diff --git a/demos/smart_classroom_demo/src/tracker.cpp b/demos/smart_classroom_demo/src/tracker.cpp
index 8c1efb250df..011e5d4ee55 100644
--- a/demos/smart_classroom_demo/src/tracker.cpp
+++ b/demos/smart_classroom_demo/src/tracker.cpp
@@ -17,7 +17,7 @@ const int TrackedObject::UNKNOWN_LABEL_IDX = -1;
 
 class KuhnMunkres::Impl {
 public:
-    Impl() : n_() {}
+    explicit Impl(bool greedy) : n_(), greedy_(greedy) {}
 
     std::vector<size_t> Solve(const cv::Mat &dissimilarity_matrix) {
         CV_Assert(dissimilarity_matrix.type() == CV_32F);
@@ -131,6 +131,10 @@ class KuhnMunkres::Impl {
 
     void Run() {
         TrySimpleCase();
+
+        if (greedy_)
+            return;
+
         while (!CheckIfOptimumIsFound()) {
             while (true) {
                 auto point = FindUncoveredMinValPos();
@@ -188,9 +192,10 @@ class KuhnMunkres::Impl {
     std::vector<int> is_col_visited_;
 
     int n_;
+    bool greedy_;
 };
 
-KuhnMunkres::KuhnMunkres() { impl_ = std::make_shared<Impl>(); }
+KuhnMunkres::KuhnMunkres(bool greedy) : impl_(std::make_shared<Impl>(greedy)) {}
 
 std::vector<size_t> KuhnMunkres::Solve(const cv::Mat &dissimilarity_matrix) {
     CV_Assert(impl_ != nullptr);
@@ -369,11 +374,6 @@ void Tracker::DropForgottenTracks() {
             new_tracks.emplace(reassign_id ? counter : pair.first, pair.second);
             new_active_tracks.emplace(reassign_id ? counter : pair.first);
             counter++;
-
-        } else {
-            if (IsTrackValid(pair.first)) {
-                valid_tracks_counter_++;
-            }
         }
     }
     tracks_.swap(new_tracks);
@@ -382,12 +382,6 @@ void Tracker::DropForgottenTracks() {
     tracks_counter_ = reassign_id ? counter : tracks_counter_;
 }
 
-void Tracker::DropForgottenTrack(size_t track_id) {
-    CV_Assert(IsTrackForgotten(track_id));
-    CV_Assert(active_track_ids_.count(track_id) == 0);
-    tracks_.erase(track_id);
-}
-
 float Tracker::ShapeAffinity(const cv::Rect &trk, const cv::Rect &det) {
     float w_dist = static_cast<float>(std::fabs(trk.width - det.width)) / static_cast<float>(trk.width + det.width);
     float h_dist = static_cast<float>(std::fabs(trk.height - det.height)) / static_cast<float>(trk.height + det.height);
@@ -495,19 +489,10 @@ void Tracker::Reset() {
     detections_.clear();
 
     tracks_counter_ = 0;
-    valid_tracks_counter_ = 0;
 
     frame_size_ = cv::Size();
 }
 
-size_t Tracker::Count() const {
-    size_t count = valid_tracks_counter_;
-    for (const auto &pair : tracks_) {
-        count += (IsTrackValid(pair.first) ? 1 : 0);
-    }
-    return count;
-}
-
 TrackedObjects Tracker::TrackedDetections() const {
     TrackedObjects detections;
     for (size_t idx : active_track_ids()) {
diff --git a/demos/super_resolution_demo/CMakeLists.txt b/demos/super_resolution_demo/CMakeLists.txt
index 19fa5a1deff..7e052e0b349 100644
--- a/demos/super_resolution_demo/CMakeLists.txt
+++ b/demos/super_resolution_demo/CMakeLists.txt
@@ -5,5 +5,4 @@
 ie_add_sample(NAME super_resolution_demo
               SOURCES "${CMAKE_CURRENT_SOURCE_DIR}/main.cpp"
               HEADERS "${CMAKE_CURRENT_SOURCE_DIR}/super_resolution_demo.h"
-              DEPENDENCIES format_reader
               OPENCV_DEPENDENCIES highgui)
diff --git a/demos/super_resolution_demo/README.md b/demos/super_resolution_demo/README.md
index e24a623ed86..275e10f7154 100644
--- a/demos/super_resolution_demo/README.md
+++ b/demos/super_resolution_demo/README.md
@@ -21,7 +21,7 @@ performs upscale using super resolution model.
 ## Running
 
 Running the application with the `-h` option yields the following usage message:
-```sh
+```
 ./super_resolution_demo -h
 InferenceEngine:
     API version ............ <version>
diff --git a/demos/super_resolution_demo/main.cpp b/demos/super_resolution_demo/main.cpp
index 5b81b58144a..f10d2ac869d 100644
--- a/demos/super_resolution_demo/main.cpp
+++ b/demos/super_resolution_demo/main.cpp
@@ -12,11 +12,7 @@
 #include <string>
 #include <memory>
 
-#include <format_reader_ptr.h>
 #include <inference_engine.hpp>
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
 
 #include <samples/slog.hpp>
 #include <samples/args_helper.hpp>
@@ -70,18 +66,6 @@ int main(int argc, char *argv[]) {
         slog::info << "Device info: " << slog::endl;
         std::cout << ie.GetVersions(FLAGS_d) << std::endl;
 
-#ifdef WITH_EXTENSIONS
-        /** Loading default extensions **/
-        if (FLAGS_d.find("CPU") != std::string::npos) {
-            /**
-             * cpu_extensions library is compiled from "extension" folder containing
-             * custom MKLDNNPlugin layer implementations. These layers are not supported
-             * by mkldnn, but they can be useful for inferring custom topologies.
-            **/
-            ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-        }
-#endif
-
         if (!FLAGS_l.empty()) {
             // CPU(MKLDNN) extensions are loaded as a shared library and passed as a pointer to base extension
             IExtensionPtr extension_ptr = make_so_pointer<IExtension>(FLAGS_l);
@@ -98,14 +82,8 @@ int main(int argc, char *argv[]) {
         // --------------------------- 2. Read IR Generated by ModelOptimizer (.xml and .bin files) ------------
         slog::info << "Loading network files" << slog::endl;
 
-        CNNNetReader networkReader;
         /** Read network model **/
-        networkReader.ReadNetwork(FLAGS_m);
-
-        /** Extract model name and load weights **/
-        std::string binFileName = fileNameNoExt(FLAGS_m) + ".bin";
-        networkReader.ReadWeights(binFileName);
-        CNNNetwork network = networkReader.getNetwork();
+        auto network = ie.ReadNetwork(FLAGS_m);
         // -----------------------------------------------------------------------------------------------------
 
         // --------------------------- 3. Configure input & output ---------------------------------------------
@@ -124,18 +102,18 @@ int main(int argc, char *argv[]) {
         /** Collect images**/
         std::vector<cv::Mat> inputImages;
         for (const auto &i : imageNames) {
-            cv::Mat img = cv::imread(i, cv::IMREAD_UNCHANGED);
-            if (img.empty()) {
-                slog::warn << "Image " + i + " cannot be read!" << slog::endl;
-                continue;
-            }
-
             /** Get size of low resolution input **/
             auto lrInputInfoItem = inputInfo[lrInputBlobName];
             int w = static_cast<int>(lrInputInfoItem->getTensorDesc().getDims()[3]);
             int h = static_cast<int>(lrInputInfoItem->getTensorDesc().getDims()[2]);
             int c = static_cast<int>(lrInputInfoItem->getTensorDesc().getDims()[1]);
 
+            cv::Mat img = cv::imread(i, c == 1 ? cv::IMREAD_GRAYSCALE : cv::IMREAD_COLOR);
+            if (img.empty()) {
+                slog::warn << "Image " + i + " cannot be read!" << slog::endl;
+                continue;
+            }
+
             if (w != img.cols || h != img.rows) {
                 slog::warn << "Size of the image " << i << " is not equal to WxH = " << w << "x" << h << slog::endl;
                 continue;
diff --git a/demos/super_resolution_demo/super_resolution_demo.h b/demos/super_resolution_demo/super_resolution_demo.h
index aa82ba9094b..f97a0fcc73d 100644
--- a/demos/super_resolution_demo/super_resolution_demo.h
+++ b/demos/super_resolution_demo/super_resolution_demo.h
@@ -9,60 +9,27 @@
 #include <gflags/gflags.h>
 #include <iostream>
 
-/// @brief message for help argument
 static const char help_message[] = "Print a usage message.";
-
-/// @brief message for images argument
 static const char image_message[] = "Required. Path to an image.";
-
-/// @brief message for model argument
-static const char model_message[] = "Required. Path to an .xml file with a trained model.";\
-
-/// @brief message for plugin argument
-static const char plugin_message[] = "Plugin name. For example MKLDNNPlugin. If this parameter is pointed, " \
-"the demo will look for this plugin only";
-
-/// @brief message for assigning cnn calculation to device
-static const char target_device_message[] = "Optional. Specify the target device to infer on (the list of available devices is shown below). " \
-                                            "Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. " \
+static const char model_message[] = "Required. Path to an .xml file with a trained model.";
+static const char plugin_message[] = "Plugin name. For example MKLDNNPlugin. If this parameter is pointed, "
+                                     "the demo will look for this plugin only";
+static const char target_device_message[] = "Optional. Specify the target device to infer on (the list of available devices is shown below). "
+                                            "Default value is CPU. Use \"-d HETERO:<comma-separated_devices_list>\" format to specify HETERO plugin. "
                                             "The demo will look for a suitable plugin for the specified device.";
-
-/// @brief message for user library argument
-static const char custom_cpu_library_message[] = "Required for CPU custom layers." \
+static const char custom_cpu_library_message[] = "Required for CPU custom layers."
                                                  "Absolute path to a shared library with the kernels implementations.";
-
-/// @brief message for clDNN custom kernels desc
-static const char custom_cldnn_message[] = "Required for GPU custom kernels."\
+static const char custom_cldnn_message[] = "Required for GPU custom kernels."
                                             "Absolute path to the xml file with the kernels descriptions.";
-
-/// @brief message for show argument
 static const char show_processed_images[] = "Optional. Show processed images. Default value is false.";
 
 
-/// @brief Define flag for showing help message <br>
 DEFINE_bool(h, false, help_message);
-
-/// @brief Define parameter for set image file <br>
-/// It is a required parameter
 DEFINE_string(i, "", image_message);
-
-/// @brief Define parameter for set model file <br>
-/// It is a required parameter
 DEFINE_string(m, "", model_message);
-
-/// @brief device the target device to infer on <br>
 DEFINE_string(d, "CPU", target_device_message);
-
-/// @brief Absolute path to CPU library with user layers <br>
-/// It is a required parameter
 DEFINE_string(l, "", custom_cpu_library_message);
-
-/// @brief Define parameter for clDNN custom kernels path <br>
-/// Default is ./lib
 DEFINE_string(c, "", custom_cldnn_message);
-
-/// @brief Flag to show processed images<br>
-/// It is an optional parameter
 DEFINE_bool(show, false, show_processed_images);
 
 /**
diff --git a/demos/tests/args.py b/demos/tests/args.py
index 5df36eb6347..9512697c048 100644
--- a/demos/tests/args.py
+++ b/demos/tests/args.py
@@ -18,7 +18,8 @@
 from pathlib import Path
 
 ArgContext = collections.namedtuple('ArgContext',
-    ['test_data_dir', 'dl_dir', 'model_info', 'image_sequences', 'image_sequence_dir'])
+    ['source_dir', 'test_data_dir', 'dl_dir', 'model_info', 'data_sequences', 'data_sequence_dir'])
+
 
 class TestDataArg:
     def __init__(self, rel_path):
@@ -27,9 +28,19 @@ def __init__(self, rel_path):
     def resolve(self, context):
         return str(context.test_data_dir / self.rel_path)
 
+
 def image_net_arg(id):
     return TestDataArg('ILSVRC2012_img_val/ILSVRC2012_val_{}.JPEG'.format(id))
 
+
+def brats_arg(id):
+    return TestDataArg('BraTS/{}'.format(id))
+
+
+def image_retrieval_arg(id):
+    return TestDataArg('Image_Retrieval/{}'.format(id))
+
+
 class ModelArg:
     def __init__(self, name, precision='FP32'):
         self.name = name
@@ -38,16 +49,17 @@ def __init__(self, name, precision='FP32'):
     def resolve(self, context):
         return str(context.dl_dir / context.model_info[self.name]["subdirectory"] / self.precision / (self.name + '.xml'))
 
-class ImagePatternArg:
+
+class DataPatternArg:
     def __init__(self, sequence_name):
         self.sequence_name = sequence_name
 
     def resolve(self, context):
-        seq_dir = context.image_sequence_dir / self.sequence_name
-        seq = [Path(image.resolve(context))
-            for image in context.image_sequences[self.sequence_name]]
+        seq_dir = context.data_sequence_dir / self.sequence_name
+        seq = [Path(data.resolve(context))
+            for data in context.data_sequences[self.sequence_name]]
 
-        assert len(set(image.suffix for image in seq)) == 1, "all images in the sequence must have the same extension"
+        assert len(set(data.suffix for data in seq)) == 1, "all images in the sequence must have the same extension"
         assert '%' not in seq[0].suffix
 
         name_format = 'input-%04d' + seq[0].suffix
@@ -55,15 +67,24 @@ def resolve(self, context):
         if not seq_dir.is_dir():
             seq_dir.mkdir(parents=True)
 
-            for index, image in enumerate(context.image_sequences[self.sequence_name]):
-                shutil.copyfile(image.resolve(context), str(seq_dir / (name_format % index)))
+            for index, data in enumerate(context.data_sequences[self.sequence_name]):
+                shutil.copyfile(data.resolve(context), str(seq_dir / (name_format % index)))
 
         return str(seq_dir / name_format)
 
-class ImageDirectoryArg:
+
+class DataDirectoryArg:
     def __init__(self, sequence_name):
-        self.backend = ImagePatternArg(sequence_name)
+        self.backend = DataPatternArg(sequence_name)
 
     def resolve(self, context):
         pattern = self.backend.resolve(context)
         return str(Path(pattern).parent)
+
+
+class DemoFileArg:
+    def __init__(self, file_name):
+        self.file_name = file_name
+
+    def resolve(self, context):
+        return str(context.source_dir / self.file_name)
diff --git a/demos/tests/cases.py b/demos/tests/cases.py
index 555a959f588..c5e43676043 100644
--- a/demos/tests/cases.py
+++ b/demos/tests/cases.py
@@ -16,44 +16,60 @@
 import sys
 
 from args import *
-from image_sequences import IMAGE_SEQUENCES
-
-ALL_DEVICES = ['CPU', 'GPU']
+from data_sequences import DATA_SEQUENCES
 
+MONITORS = {'-u': 'cdm'}
 TestCase = collections.namedtuple('TestCase', ['options'])
 
-class NativeDemo:
-    def __init__(self, name, test_cases):
-        self._name = name
+class Demo:
+    """Common base of the demo descriptors; reads ``self.device_keys``, which the subclasses assign."""
+    def device_args(self, device_list):
+        if len(self.device_keys) > 0:  # every device key is followed by the same device name
+            return {dev: [tok for flag in self.device_keys for tok in (flag, dev)] for dev in device_list}
+        return {'CPU': []}  # no device keys: a single 'CPU' entry with no extra arguments
+
+class NativeDemo(Demo):
+    def __init__(self, subdirectory, device_keys, test_cases):
+        self.subdirectory = subdirectory
+
+        self.device_keys = device_keys
 
         self.test_cases = test_cases
 
+        self._name = subdirectory.replace('/', '_')
+
     @property
     def full_name(self):
         return self._name
 
     def models_lst_path(self, source_dir):
-        return source_dir / self._name / 'models.lst'
+        return source_dir / self.subdirectory / 'models.lst'
 
     def fixed_args(self, source_dir, build_dir):
         return [str(build_dir / self._name)]
 
-class PythonDemo:
-    def __init__(self, name, test_cases):
-        self._name = name
+class PythonDemo(Demo):
+    def __init__(self, subdirectory, device_keys, test_cases):
+        self.subdirectory = 'python_demos/' + subdirectory
+
+        self.device_keys = device_keys
 
         self.test_cases = test_cases
 
+        self._name = subdirectory.replace('/', '_')
+
     @property
     def full_name(self):
         return 'py/' + self._name
 
     def models_lst_path(self, source_dir):
-        return source_dir / 'python_demos' / self._name / 'models.lst'
+        return source_dir / self.subdirectory / 'models.lst'
 
     def fixed_args(self, source_dir, build_dir):
+        cpu_extension_path = build_dir / 'lib/libcpu_extension.so'
+
         return [sys.executable, str(source_dir / 'python_demos' / self._name / (self._name + '.py')),
-            '-l', str(build_dir / 'lib/libcpu_extension.so')]
+            *(['-l', str(cpu_extension_path)] if cpu_extension_path.exists() else [])]
 
 def join_cases(*args):
     options = {}
@@ -67,23 +83,30 @@ def combine_cases(*args):
 def single_option_cases(key, *args):
     return [TestCase(options={} if arg is None else {key: arg}) for arg in args]
 
-def device_cases(*args):
-    return [TestCase(options={opt: device for opt in args}) for device in ALL_DEVICES]
 
 NATIVE_DEMOS = [
-    NativeDemo(name='crossroad_camera_demo', test_cases=combine_cases(
+    NativeDemo(subdirectory='crossroad_camera_demo',
+            device_keys=['-d', '-d_pa', '-d_reid'],
+            test_cases=combine_cases(
         TestCase(options={'-no_show': None,
-            '-i': ImagePatternArg('person-vehicle-bike-detection-crossroad')}),
-        device_cases('-d', '-d_pa', '-d_reid'),
+            **MONITORS,
+            '-i': DataPatternArg('person-vehicle-bike-detection-crossroad')}),
         TestCase(options={'-m': ModelArg('person-vehicle-bike-detection-crossroad-0078')}),
         single_option_cases('-m_pa', None, ModelArg('person-attributes-recognition-crossroad-0230')),
-        single_option_cases('-m_reid', None, ModelArg('person-reidentification-retail-0079')),
+        single_option_cases('-m_reid',
+            None,
+            ModelArg('person-reidentification-retail-0031'),
+            ModelArg('person-reidentification-retail-0103'),
+            ModelArg('person-reidentification-retail-0107'),
+            ModelArg('person-reidentification-retail-0200')),
     )),
 
-    NativeDemo(name='gaze_estimation_demo', test_cases=combine_cases(
+    NativeDemo(subdirectory='gaze_estimation_demo',
+            device_keys=['-d', '-d_fd', '-d_hp', '-d_lm'],
+            test_cases=combine_cases(
         TestCase(options={'-no_show': None,
-            '-i': ImagePatternArg('gaze-estimation-adas')}),
-        device_cases('-d', '-d_fd', '-d_hp', '-d_lm'),
+            **MONITORS,
+            '-i': DataPatternArg('gaze-estimation-adas')}),
         TestCase(options={
             '-m': ModelArg('gaze-estimation-adas-0002'),
             '-m_fd': ModelArg('face-detection-adas-0001'),
@@ -92,17 +115,19 @@ def device_cases(*args):
         }),
     )),
 
-    NativeDemo(name='human_pose_estimation_demo', test_cases=combine_cases(
+    NativeDemo(subdirectory='human_pose_estimation_demo', device_keys=['-d'], test_cases=combine_cases(
         TestCase(options={'-no_show': None,
-            '-i': ImagePatternArg('human-pose-estimation')}),
-        device_cases('-d'),
+            **MONITORS,
+            '-i': DataPatternArg('human-pose-estimation')}),
         TestCase(options={'-m': ModelArg('human-pose-estimation-0001')}),
     )),
 
-    NativeDemo(name='interactive_face_detection_demo', test_cases=combine_cases(
+    NativeDemo(subdirectory='interactive_face_detection_demo',
+            device_keys=['-d', '-d_ag', '-d_em', '-d_lm', '-d_hp'],
+            test_cases=combine_cases(
         TestCase(options={'-no_show': None,
-            '-i': ImagePatternArg('face-detection-adas')}),
-        device_cases('-d', '-d_ag', '-d_em', '-d_lm', '-d_hp'),
+            **MONITORS,
+            '-i': DataPatternArg('face-detection-adas')}),
         TestCase(options={'-m': ModelArg('face-detection-adas-0001')}),
         [
             TestCase(options={}),
@@ -119,120 +144,250 @@ def device_cases(*args):
         ],
     )),
 
-    # TODO: mask_rcnn_demo
+    NativeDemo(subdirectory='mask_rcnn_demo', device_keys=['-d'], test_cases=combine_cases(
+        TestCase(options={'-i': DataDirectoryArg('semantic-segmentation-adas')}),
+        single_option_cases('-m',
+            ModelArg('mask_rcnn_inception_resnet_v2_atrous_coco'),
+            ModelArg('mask_rcnn_inception_v2_coco'),
+            ModelArg('mask_rcnn_resnet101_atrous_coco'),
+            ModelArg('mask_rcnn_resnet50_atrous_coco'))
+    )),
 
-    # TODO: multichannel demos
+    NativeDemo(subdirectory='multi_channel/face_detection_demo',
+            device_keys=['-d'],
+            test_cases=combine_cases(
+        TestCase(options={'-no_show': None,
+            **MONITORS,
+            '-i': DATA_SEQUENCES['face-detection-adas']}),
+        single_option_cases('-m',
+            ModelArg('face-detection-adas-0001'),
+            ModelArg('face-detection-adas-binary-0001', "FP32-INT1"),
+            ModelArg('face-detection-retail-0004'),
+            ModelArg('face-detection-retail-0005'),
+            ModelArg('face-detection-retail-0044')),
+    )),
 
-    # TODO: object_detection_demo_faster_rcnn
+    NativeDemo(subdirectory='multi_channel/human_pose_estimation_demo', device_keys=['-d'],
+            test_cases=combine_cases(
+        TestCase(options={'-no_show': None,
+            **MONITORS,
+            '-i': DATA_SEQUENCES['human-pose-estimation'],
+            '-m': ModelArg('human-pose-estimation-0001')}),
+    )),
 
-    NativeDemo(name='object_detection_demo_ssd_async', test_cases=combine_cases(
-        TestCase(options={'-no_show': None}),
+    NativeDemo(subdirectory='object_detection_demo_ssd_async', device_keys=[], test_cases=combine_cases(
+        TestCase(options={'-no_show': None, **MONITORS}),
         [
             TestCase(options={
                 '-m': ModelArg('face-detection-adas-0001'),
-                '-i': ImagePatternArg('face-detection-adas'),
+                '-i': DataPatternArg('face-detection-adas'),
             }),
             TestCase(options={
                 '-m': ModelArg('person-detection-retail-0002'),
-                '-i': ImagePatternArg('person-detection-retail'),
+                '-i': DataPatternArg('person-detection-retail'),
             }),
             TestCase(options={
                 '-m': ModelArg('person-detection-retail-0013'),
-                '-i': ImagePatternArg('person-detection-retail'),
+                '-i': DataPatternArg('person-detection-retail'),
             }),
         ],
     )),
 
-    # TODO: object_detection_demo_yolov3_async
+    # TODO: object_detection_demo_yolov3_async: no models.lst
 
-    NativeDemo('pedestrian_tracker_demo', test_cases=combine_cases(
+    NativeDemo('pedestrian_tracker_demo', device_keys=['-d_det', '-d_reid'], test_cases=combine_cases(
         TestCase(options={'-no_show': None,
-            '-i': ImageDirectoryArg('person-detection-retail')}),
-        device_cases('-d_det', '-d_reid'),
+            **MONITORS,
+            '-i': DataPatternArg('person-detection-retail')}),
         [
             TestCase(options={'-m_det': ModelArg('person-detection-retail-0002')}),
             TestCase(options={'-m_det': ModelArg('person-detection-retail-0013')}),
         ],
         single_option_cases('-m_reid',
             ModelArg('person-reidentification-retail-0031'),
-            ModelArg('person-reidentification-retail-0076'),
-            ModelArg('person-reidentification-retail-0079')),
+            ModelArg('person-reidentification-retail-0103'),
+            ModelArg('person-reidentification-retail-0107'),
+            ModelArg('person-reidentification-retail-0200')),
     )),
 
-    NativeDemo(name='security_barrier_camera_demo', test_cases=combine_cases(
+    NativeDemo(subdirectory='security_barrier_camera_demo',
+            device_keys=['-d', '-d_lpr', '-d_va'],
+            test_cases=combine_cases(
         TestCase(options={'-no_show': None,
-            '-i': ImageDirectoryArg('vehicle-license-plate-detection-barrier')}),
-        device_cases('-d', '-d_lpr', '-d_va'),
+            **MONITORS,
+            '-i': DataDirectoryArg('vehicle-license-plate-detection-barrier')}),
         TestCase(options={'-m': ModelArg('vehicle-license-plate-detection-barrier-0106')}),
-        single_option_cases('-m_lpr', None, ModelArg('license-plate-recognition-barrier-0001')),
+        single_option_cases('-m_lpr',
+            None,
+            ModelArg('license-plate-recognition-barrier-0001'),
+            ModelArg('license-plate-recognition-barrier-0007')),
         single_option_cases('-m_va', None, ModelArg('vehicle-attributes-recognition-barrier-0039')),
     )),
 
-    NativeDemo(name='segmentation_demo', test_cases=combine_cases(
-        device_cases('-d'),
+    NativeDemo(subdirectory='segmentation_demo', device_keys=['-d'], test_cases=combine_cases(
+        TestCase(options={'-no_show': None, **MONITORS}),
         [
             TestCase(options={
                 '-m': ModelArg('road-segmentation-adas-0001'),
-                '-i': ImageDirectoryArg('road-segmentation-adas'),
-            }),
-            TestCase(options={
-                '-m': ModelArg('semantic-segmentation-adas-0001'),
-                '-i': ImageDirectoryArg('semantic-segmentation-adas'),
+                '-i': DataPatternArg('road-segmentation-adas'),
             }),
+            *combine_cases(
+                TestCase(options={'-i': DataPatternArg('semantic-segmentation-adas')}),
+                single_option_cases('-m',
+                    ModelArg('semantic-segmentation-adas-0001'),
+                    ModelArg('deeplabv3'))),
         ],
     )),
 
-    NativeDemo(name='smart_classroom_demo', test_cases=combine_cases(
+    NativeDemo(subdirectory='smart_classroom_demo',
+            device_keys=['-d_act', '-d_fd', '-d_lm', '-d_reid'],
+            test_cases=combine_cases(
         TestCase(options={'-no_show': None,
-            '-i': ImagePatternArg('smart-classroom-demo'),
+            **MONITORS,
+            '-i': DataPatternArg('smart-classroom-demo'),
             '-m_fd': ModelArg('face-detection-adas-0001')}),
-        device_cases('-d_act', '-d_fd', '-d_lm', '-d_reid'),
         [
             *combine_cases(
-                single_option_cases('-m_act',
-                    ModelArg('person-detection-action-recognition-0005'),
-                    ModelArg('person-detection-action-recognition-0006'),
-                    ModelArg('person-detection-action-recognition-teacher-0002')),
-                single_option_cases('-m_lm', None, ModelArg('landmarks-regression-retail-0009')),
-                single_option_cases('-m_reid', None, ModelArg('face-reidentification-retail-0095'))),
+                [
+                    TestCase(options={'-m_act': ModelArg('person-detection-action-recognition-0005')}),
+                    TestCase(options={'-m_act': ModelArg('person-detection-action-recognition-0006'),
+                        '-student_ac': 'sitting,writing,raising_hand,standing,turned_around,lie_on_the_desk'}),
+                    # person-detection-action-recognition-teacher-0002 is meant to be used together with -teacher_id,
+                    # but that would also require a gallery file passed with the -fg key. Without -teacher_id,
+                    # -teacher_ac is ignored, so just run the test with the default actions, as if it were about students.
+                    TestCase(options={'-m_act': ModelArg('person-detection-action-recognition-teacher-0002')}),
+                ],
+                [
+                    TestCase(options={}),
+                    TestCase(options={
+                        '-m_lm': ModelArg('landmarks-regression-retail-0009'),
+                        '-m_reid': ModelArg('face-reidentification-retail-0095'),
+                    }),
+                ],
+            ),
             TestCase(options={'-m_act': ModelArg('person-detection-raisinghand-recognition-0001'), '-a_top': '5'}),
         ],
     )),
 
-    NativeDemo(name='super_resolution_demo', test_cases=combine_cases(
-        TestCase(options={'-i': ImageDirectoryArg('single-image-super-resolution')}),
-        device_cases('-d'),
+    NativeDemo(subdirectory='super_resolution_demo', device_keys=['-d'], test_cases=combine_cases(
+        TestCase(options={'-i': DataDirectoryArg('single-image-super-resolution')}),
         TestCase(options={
             '-m': ModelArg('single-image-super-resolution-1033'),
         }),
     )),
 
-    NativeDemo(name='text_detection_demo', test_cases=combine_cases(
+    NativeDemo(subdirectory='text_detection_demo', device_keys=['-d_td', '-d_tr'], test_cases=combine_cases(
         TestCase(options={'-no_show': None, '-dt': 'video',
-            '-i': ImagePatternArg('text-detection')}),
-        device_cases('-d_td', '-d_tr'),
+            **MONITORS,
+            '-i': DataPatternArg('text-detection')}),
         single_option_cases('-m_td', ModelArg('text-detection-0003'), ModelArg('text-detection-0004')),
         single_option_cases('-m_tr', None, ModelArg('text-recognition-0012')),
     )),
 ]
 
 PYTHON_DEMOS = [
-    # TODO: 3d_segmentation_demo
-    # TODO: action_recognition
-    # TODO: instance_segmentation_demo
-    # TODO: object_detection_demo_ssd_async
-    # TODO: object_detection_demo_yolov3_async
-
-    PythonDemo(name='segmentation_demo', test_cases=combine_cases(
-        device_cases('-d'),
+    PythonDemo(subdirectory='3d_segmentation_demo', device_keys=['-d'], test_cases=combine_cases(
+        TestCase(options={'-m': ModelArg('brain-tumor-segmentation-0001'),
+                          '-o': '.'}),
+        single_option_cases('-i', *DATA_SEQUENCES['brain-tumor-nifti']),
+    )),
+
+    PythonDemo(subdirectory='action_recognition', device_keys=['-d'], test_cases=combine_cases(
+        TestCase(options={'--no_show': None, '-i': DataPatternArg('action-recognition')}),
+        [
+            TestCase(options={
+                '-m_en': ModelArg('action-recognition-0001-encoder'),
+                '-m_de': ModelArg('action-recognition-0001-decoder'),
+            }),
+            TestCase(options={
+                '-m_en': ModelArg('driver-action-recognition-adas-0002-encoder'),
+                '-m_de': ModelArg('driver-action-recognition-adas-0002-decoder'),
+            }),
+        ],
+    )),
+
+    PythonDemo(subdirectory='face_recognition_demo', device_keys=['-d_fd', '-d_lm', '-d_reid'],
+               test_cases=combine_cases(
+        TestCase(options={'--no_show': None,
+                          '-i': DataPatternArg('face-detection-adas'),
+                          '-fg': DataDirectoryArg('face-recognition-gallery')
+                          }),
+        single_option_cases('-m_fd',
+            ModelArg('face-detection-adas-0001'),
+            ModelArg('face-detection-adas-binary-0001', "FP32-INT1"),
+            ModelArg('face-detection-retail-0004'),
+            ModelArg('face-detection-retail-0005'),
+            ModelArg('face-detection-retail-0044')),
+        TestCase(options={'-m_lm': ModelArg('landmarks-regression-retail-0009')}),
+        TestCase(options={'-m_reid': ModelArg('face-reidentification-retail-0095')}),
+    )),
+
+    PythonDemo(subdirectory='human_pose_estimation_3d_demo', device_keys=['-d'], test_cases=combine_cases(
+        TestCase(options={'--no_show': None,
+                          '-i': DataPatternArg('human-pose-estimation')}),
+        TestCase(options={'-m': ModelArg('human-pose-estimation-3d-0001')}),
+    )),
+
+    PythonDemo(subdirectory='image_retrieval_demo', device_keys=['-d'], test_cases=combine_cases(
+        TestCase(options={'--no_show':None,
+                          '-m': ModelArg('image-retrieval-0001')}),
+        single_option_cases('-i', *DATA_SEQUENCES['image-retrieval-video']),
+        single_option_cases('-g', image_retrieval_arg('gallery.txt')),
+    )),
+
+    PythonDemo(subdirectory='instance_segmentation_demo', device_keys=[], test_cases=combine_cases(
+        TestCase(options={'--no_show': None,
+            '-i': DataPatternArg('instance-segmentation'),
+            '--delay': '1',
+            '-d': 'CPU',  # GPU is not supported
+            '--labels': DemoFileArg('coco_labels.txt')}),
+        single_option_cases('-m',
+            ModelArg('instance-segmentation-security-0010'),
+            ModelArg('instance-segmentation-security-0050'),
+            ModelArg('instance-segmentation-security-0083')),
+    )),
+
+    PythonDemo(subdirectory='multi_camera_multi_person_tracking', device_keys=['-d'], test_cases=combine_cases(
+        TestCase(options={'--no_show': None,
+            '-i': [DataPatternArg('multi-camera-multi-person-tracking'),
+                DataPatternArg('multi-camera-multi-person-tracking/repeated')],
+            '-m': ModelArg('person-detection-retail-0013')}),
+        single_option_cases('--m_reid',
+            ModelArg('person-reidentification-retail-0031'),
+            ModelArg('person-reidentification-retail-0103'),
+            ModelArg('person-reidentification-retail-0107'),
+            ModelArg('person-reidentification-retail-0200')),
+    )),
+
+    PythonDemo(subdirectory='object_detection_demo_ssd_async', device_keys=['-d'], test_cases=combine_cases(
+        TestCase(options={'--no_show': None,
+            '-i': DataPatternArg('object-detection-demo-ssd-async')}),
+        single_option_cases('-m',
+            ModelArg('face-detection-adas-0001'),
+            ModelArg('face-detection-adas-binary-0001', "FP32-INT1"),
+            ModelArg('face-detection-retail-0004'),
+            ModelArg('face-detection-retail-0005'),
+            ModelArg('face-detection-retail-0044'),
+            ModelArg('pedestrian-and-vehicle-detector-adas-0001'),
+            ModelArg('pedestrian-detection-adas-0002'),
+            ModelArg('pedestrian-detection-adas-binary-0001', "FP32-INT1"),
+            ModelArg('person-detection-retail-0013'),
+            ModelArg('vehicle-detection-adas-0002'),
+            ModelArg('vehicle-detection-adas-binary-0001', "FP32-INT1"),
+            ModelArg('vehicle-license-plate-detection-barrier-0106')),
+    )),
+
+    # TODO: object_detection_demo_yolov3_async: no models.lst
+
+    PythonDemo(subdirectory='segmentation_demo', device_keys=['-d'], test_cases=combine_cases(
         [
             TestCase(options={
                 '-m': ModelArg('road-segmentation-adas-0001'),
-                '-i': IMAGE_SEQUENCES['road-segmentation-adas'],
+                '-i': DATA_SEQUENCES['road-segmentation-adas'],
             }),
             TestCase(options={
                 '-m': ModelArg('semantic-segmentation-adas-0001'),
-                '-i': IMAGE_SEQUENCES['semantic-segmentation-adas'],
+                '-i': DATA_SEQUENCES['semantic-segmentation-adas'],
             }),
         ],
     )),
diff --git a/demos/tests/image_sequences.py b/demos/tests/data_sequences.py
similarity index 62%
rename from demos/tests/image_sequences.py
rename to demos/tests/data_sequences.py
index 17d4ba48683..2692f545650 100644
--- a/demos/tests/image_sequences.py
+++ b/demos/tests/data_sequences.py
@@ -12,9 +12,36 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-from args import image_net_arg
+from args import image_net_arg, brats_arg, image_retrieval_arg
+
+DATA_SEQUENCES = {
+    'action-recognition': [
+        image_net_arg('00000001'),
+        image_net_arg('00000002'),
+        image_net_arg('00000003'),
+        image_net_arg('00000004'),
+        image_net_arg('00000005'),
+        image_net_arg('00000006'),
+        image_net_arg('00000007'),
+        image_net_arg('00000008'),
+        image_net_arg('00000009'),
+        image_net_arg('00000010'),
+        image_net_arg('00000011'),
+        image_net_arg('00000012'),
+        image_net_arg('00000013'),
+        image_net_arg('00000014'),
+        image_net_arg('00000015'),
+        image_net_arg('00000016'),
+        image_net_arg('00000017'),
+        image_net_arg('00000018'),
+        image_net_arg('00000019'),
+        image_net_arg('00000020'),
+    ],
+
+    'brain-tumor-nifti': [
+        brats_arg('BRATS_485.nii.gz'),
+    ],
 
-IMAGE_SEQUENCES = {
     'face-detection-adas': [
         image_net_arg('00000002'),
         image_net_arg('00000032'),
@@ -28,6 +55,12 @@
         image_net_arg('00045630'),
     ],
 
+    'face-recognition-gallery': [
+        image_net_arg('00000184'),
+        image_net_arg('00008165'),
+        image_net_arg('00040548'),
+    ],
+
     'gaze-estimation-adas': [
         image_net_arg('00008165'),
         image_net_arg('00008170'),
@@ -54,17 +87,66 @@
         image_net_arg('00048311'),
     ],
 
+    'image-retrieval-video': [
+        image_retrieval_arg('4946fb41-9da0-4af7-a858-b443bee6d0f6.dav'),
+    ],
+
+    'instance-segmentation': [
+        image_net_arg('00000001'),
+        image_net_arg('00000002'),
+        image_net_arg('00000002'), # the demo has simple reid
+        image_net_arg('00000003'),
+        image_net_arg('00000004'),
+        image_net_arg('00000008'),
+        image_net_arg('00000010'),
+        image_net_arg('00000017'),
+        image_net_arg('00000019'),
+        image_net_arg('00000020'),
+    ],
+
+    'multi-camera-multi-person-tracking': [
+        image_net_arg('00000002'),
+        image_net_arg('00000032'),
+        image_net_arg('00017291'),
+        image_net_arg('00017293'),
+        image_net_arg('00040547'),
+        image_net_arg('00000002'),
+        image_net_arg('00000032'),
+        image_net_arg('00017291'),
+        image_net_arg('00017293'),
+        image_net_arg('00040547'),
+        image_net_arg('00000002'),
+    ],
+
+    'multi-camera-multi-person-tracking/repeated': [image_net_arg('00000002')] * 11,
+
+    'object-detection-demo-ssd-async': [
+        image_net_arg('00000001'),
+        image_net_arg('00000002'),
+        image_net_arg('00000003'),
+        image_net_arg('00000004'),
+        image_net_arg('00000005'),
+        image_net_arg('00000006'),
+        image_net_arg('00000007'),
+        image_net_arg('00000008'),
+        image_net_arg('00000014'),
+        image_net_arg('00000018'),
+        image_net_arg('00000022'),
+        image_net_arg('00000023'),
+        image_net_arg('00000032'),
+    ],
+
     'person-detection-retail': [
+        image_net_arg('00000002'),
+        image_net_arg('00000002'),
+        image_net_arg('00000002'),
+        image_net_arg('00000002'),
         image_net_arg('00000002'),
         image_net_arg('00000032'),
-        image_net_arg('00000184'),
-        image_net_arg('00000442'),
-        image_net_arg('00008165'),
+        image_net_arg('00000002'),
         image_net_arg('00017291'),
         image_net_arg('00017293'),
         image_net_arg('00040547'),
-        image_net_arg('00040548'),
-        image_net_arg('00040554'),
     ],
 
     'person-vehicle-bike-detection-crossroad': [
@@ -110,6 +192,16 @@
         image_net_arg('00005409'),
     ],
 
+    'smart-classroom-demo': [
+        image_net_arg('00000074'),
+        image_net_arg('00000164'),
+        image_net_arg('00000181'),
+        image_net_arg('00000164'),
+        image_net_arg('00000181'),
+        image_net_arg('00000001'),
+        image_net_arg('00000074'),
+    ],
+
     'text-detection': [
         image_net_arg('00000032'),
         image_net_arg('00001893'),
@@ -135,16 +227,4 @@
         image_net_arg('00037128'),
         image_net_arg('00048316'),
     ],
-
-    'smart-classroom-demo': [
-        image_net_arg('00000074'),
-        image_net_arg('00000141'),
-        image_net_arg('00000141'),
-        image_net_arg('00000164'),
-        image_net_arg('00000181'),
-        image_net_arg('00000164'),
-        image_net_arg('00000181'),
-        image_net_arg('00000001'),
-        image_net_arg('00000074'),
-    ],
 }
diff --git a/demos/tests/run_tests.py b/demos/tests/run_tests.py
old mode 100755
new mode 100644
index f20bbd777aa..7ce42925f60
--- a/demos/tests/run_tests.py
+++ b/demos/tests/run_tests.py
@@ -17,25 +17,32 @@
 """
 Test script for the demos.
 
-For the tests to work, the test data directory must contain a "ILSVRC2012_img_val"
-subdirectory with the ILSVRC2012 dataset.
+For the tests to work, the test data directory must contain:
+* a "BraTS" subdirectory with the brain tumor dataset in NIFTI format (see http://medicaldecathlon.com,
+  https://drive.google.com/open?id=1A2IU8Sgea1h3fYLpYtFb2v7NYdMjvEhU);
+* an "ILSVRC2012_img_val" subdirectory with the ILSVRC2012 dataset;
+* an "Image_Retrieval" subdirectory with the image retrieval dataset (images, videos) (see https://github.com/19900531/test)
+  and the list of images (see https://github.com/opencv/openvino_training_extensions/blob/develop/tensorflow_toolkit/image_retrieval/data/gallery/gallery.txt).
 """
 
 import argparse
 import collections
+import csv
 import itertools
 import json
+import os
 import shlex
 import shutil
 import subprocess
 import sys
 import tempfile
+import timeit
 
 from pathlib import Path
 
-from args import ArgContext
+from args import ArgContext, ModelArg
 from cases import DEMOS
-from image_sequences import IMAGE_SEQUENCES
+from data_sequences import DATA_SEQUENCES
 
 def parse_args():
     parser = argparse.ArgumentParser(
@@ -48,8 +55,23 @@ def parse_args():
         help='directory to use as the cache for the model downloader')
     parser.add_argument('--demos', metavar='DEMO[,DEMO...]',
         help='list of demos to run tests for (by default, every demo is tested)')
+    parser.add_argument('--mo', type=Path, metavar='MO.PY',
+        help='Model Optimizer entry point script')
+    parser.add_argument('--devices', default="CPU GPU",
+        help='list of devices to test')
+    parser.add_argument('--report-file', type=Path,
+        help='path to report file')
     return parser.parse_args()
 
+def collect_result(demo_name, device, pipeline, execution_time, report_file):
+    """Append one result row to the CSV at report_file; the header row is written first when the file is new."""
+    first_time = not report_file.exists()
+    with report_file.open('a+', newline='') as csvfile:
+        testwriter = csv.writer(csvfile)
+        if first_time:
+            testwriter.writerow(["DemoName", "Device", "ModelsInPipeline", "ExecutionTime"])
+        testwriter.writerow([demo_name, device, " ".join(sorted(pipeline)), execution_time])  # sorted(): caller's list stays as is
+
 def main():
     args = parse_args()
 
@@ -69,6 +91,8 @@ def main():
 
     num_failures = 0
 
+    # PYTHONPATH may be unset (a plain os.environ[...] lookup raises KeyError); os.pathsep is ';' on Windows.
+    os.putenv('PYTHONPATH', os.pathsep.join(filter(None, [os.environ.get('PYTHONPATH'), "{}/lib".format(args.demo_build_dir)])))
     for demo in DEMOS:
         if demo.full_name not in demos_to_test: continue
 
@@ -94,12 +118,26 @@ def main():
                 num_failures += len(demo.test_cases)
                 continue
 
+            try:
+                subprocess.check_output(
+                    [
+                        sys.executable, '--', str(auto_tools_dir / 'converter.py'),
+                        '--download_dir', str(dl_dir), '--list', str(demo.models_lst_path(demos_dir)), '--jobs', 'auto',
+                    ] + ([] if args.mo is None else ['--mo', str(args.mo)]),
+                    stderr=subprocess.STDOUT, universal_newlines=True)
+            except subprocess.CalledProcessError as e:
+                print(e.output)
+                print('Exit code:', e.returncode)
+                num_failures += len(demo.test_cases)
+                continue
+
             print()
 
             arg_context = ArgContext(
+                source_dir=demos_dir / demo.subdirectory,
                 dl_dir=dl_dir,
-                image_sequence_dir=Path(temp_dir) / 'image_seq',
-                image_sequences=IMAGE_SEQUENCES,
+                data_sequence_dir=Path(temp_dir) / 'data_seq',
+                data_sequences=DATA_SEQUENCES,
                 model_info=model_info,
                 test_data_dir=args.test_data_dir,
             )
@@ -117,23 +155,32 @@ def option_to_args(key, value):
 
             print('Fixed arguments:', ' '.join(map(shlex.quote, fixed_args)))
             print()
-
+            device_args = demo.device_args(args.devices.split())
             for test_case_index, test_case in enumerate(demo.test_cases):
+
                 case_args = [demo_arg
                     for key, value in sorted(test_case.options.items())
                     for demo_arg in option_to_args(key, value)]
 
-                print('Test case #{}:'.format(test_case_index + 1),
-                    ' '.join(shlex.quote(str(arg)) for arg in case_args))
-                print(flush=True)
-
-                try:
-                    subprocess.check_output(fixed_args + case_args,
-                        stderr=subprocess.STDOUT, universal_newlines=True)
-                except subprocess.CalledProcessError as e:
-                    print(e.output)
-                    print('Exit code:', e.returncode)
-                    num_failures += 1
+                pipeline = [value.name for key, value in test_case.options.items() if isinstance(value, ModelArg)]
+
+                for device, dev_arg in device_args.items():
+                    print('Test case #{}/{}:'.format(test_case_index, device),
+                        ' '.join(shlex.quote(str(arg)) for arg in dev_arg + case_args))
+                    print(flush=True)
+                    try:
+                        start_time = timeit.default_timer()
+                        subprocess.check_output(fixed_args + dev_arg + case_args,
+                            stderr=subprocess.STDOUT, universal_newlines=True)
+                        execution_time = timeit.default_timer() - start_time
+                    except subprocess.CalledProcessError as e:
+                        print(e.output)
+                        print('Exit code:', e.returncode)
+                        num_failures += 1
+                        execution_time = -1
+
+                    if args.report_file:
+                        collect_result(demo.full_name, device, pipeline, execution_time, args.report_file)
 
         print()
 
diff --git a/demos/text_detection_demo/CMakeLists.txt b/demos/text_detection_demo/CMakeLists.txt
index 92e342c995c..df1f6a367e6 100644
--- a/demos/text_detection_demo/CMakeLists.txt
+++ b/demos/text_detection_demo/CMakeLists.txt
@@ -9,4 +9,5 @@ ie_add_sample(NAME text_detection_demo
               SOURCES ${SOURCES}
               HEADERS ${HEADERS}
               INCLUDE_DIRECTORIES "${CMAKE_CURRENT_SOURCE_DIR}/include"
+              DEPENDENCIES monitors
               OPENCV_DEPENDENCIES highgui)
diff --git a/demos/text_detection_demo/README.md b/demos/text_detection_demo/README.md
index 7434fc216e3..8712f9c4fd3 100644
--- a/demos/text_detection_demo/README.md
+++ b/demos/text_detection_demo/README.md
@@ -20,7 +20,7 @@ If text recognition model is provided, the demo prints recognized text as well.
 ## Running
 
 Running the application with the <code>-h</code> option yields the following usage message:
-```sh
+```
 ./text_detection_demo -h
 
 text_detection_demo [OPTION]
@@ -32,7 +32,7 @@ Options:
     -m_tr "<path>"               Required. Path to the Text Recognition model (.xml) file.
     -dt "<input_data_type>"      Required. Input data type: "image" (for a single image), "list" (for a text file where images paths are listed), "video" (for a saved video), "webcam" (for a webcamera device). By default, it is "image".
     -m_tr_ss "<value>"           Optional. Symbol set for the Text Recognition model.
-    -cc                          Optional. If it is set, then in case of absence of the Text Detector, the Text Reconition model takes a central image crop as an input, but not full frame.
+    -cc                          Optional. If it is set, then in case of absence of the Text Detector, the Text Recognition model takes a central image crop as an input, but not full frame.
     -w_td "<value>"              Optional. Input image width for Text Detection model.
     -h_td "<value>"              Optional. Input image height for Text Detection model.
     -thr "<value>"               Optional. Specify a recognition confidence threshold. Text detection candidates with text recognition confidence below specified threshold are rejected.
@@ -45,6 +45,8 @@ Options:
     -c "<absolute_path>"         Optional. Absolute path to the GPU kernels implementation for custom layers.
     -no_show                     Optional. If it is true, then detected text will not be shown on image frame. By default, it is false.
     -r                           Optional. Output Inference results as raw values.
+    -u                           Optional. List of monitors to show initially.
+    -b                           Optional. Bandwidth for CTC beam search decoder. Default value is 0, in this case CTC greedy decoder will be used.
 ```
 
 Running the application with the empty list of options yields the usage message given above and an error message.
diff --git a/demos/text_detection_demo/include/text_recognition.hpp b/demos/text_detection_demo/include/text_recognition.hpp
index 656a7639255..60433ac92e8 100644
--- a/demos/text_detection_demo/include/text_recognition.hpp
+++ b/demos/text_detection_demo/include/text_recognition.hpp
@@ -8,3 +8,4 @@
 #include <vector>
 
 std::string CTCGreedyDecoder(const std::vector<float> &data, const std::string& alphabet, char pad_symbol, double *conf);
+std::string CTCBeamSearchDecoder(const std::vector<float> &data, const std::string& alphabet, char pad_symbol, double *conf, int bandwidth);
diff --git a/demos/text_detection_demo/main.cpp b/demos/text_detection_demo/main.cpp
index e511f153437..c39f87b6e86 100644
--- a/demos/text_detection_demo/main.cpp
+++ b/demos/text_detection_demo/main.cpp
@@ -18,11 +18,9 @@
 #include <gflags/gflags.h>
 #include <opencv2/opencv.hpp>
 
-#ifdef WITH_EXTENSIONS
-#include <ext_list.hpp>
-#endif
 #include <inference_engine.hpp>
 
+#include <monitors/presenter.h>
 #include <samples/common.hpp>
 #include <samples/slog.hpp>
 
@@ -40,7 +38,7 @@ std::vector<cv::Point2f> floatPointsFromRotatedRect(const cv::RotatedRect &rect)
 std::vector<cv::Point> boundedIntPointsFromRotatedRect(const cv::RotatedRect &rect, const cv::Size& image_size);
 cv::Point topLeftPoint(const std::vector<cv::Point2f> & points, int *idx);
 cv::Mat cropImage(const cv::Mat &image, const std::vector<cv::Point2f> &points, const cv::Size& target_size, int top_left_point_idx);
-void setLabel(cv::Mat& im, const std::string label, const cv::Point & p);
+void setLabel(cv::Mat& im, const std::string& label, const cv::Point & p);
 
 bool ParseAndCheckCommandLine(int argc, char *argv[]) {
     // ------------------------- Parsing and validating input arguments --------------------------------------
@@ -111,10 +109,6 @@ int main(int argc, char *argv[]) {
 
             /** Load extensions for the CPU device **/
             if ((device.find("CPU") != std::string::npos)) {
-#ifdef WITH_EXTENSIONS
-                ie.AddExtension(std::make_shared<Extensions::Cpu::CpuExtensions>(), "CPU");
-#endif
-
                 if (!FLAGS_l.empty()) {
                     // CPU(MKLDNN) extensions are loaded as a shared library and passed as a pointer to base extension
                     auto extension_ptr = make_so_pointer<IExtension>(FLAGS_l);
@@ -135,6 +129,7 @@ int main(int argc, char *argv[]) {
         auto extension_path = FLAGS_l;
         auto cls_conf_threshold = static_cast<float>(FLAGS_cls_pixel_thr);
         auto link_conf_threshold = static_cast<float>(FLAGS_link_pixel_thr);
+        auto decoder_bandwidth = FLAGS_b;
 
         slog::info << "Loading network files" << slog::endl;
         Cnn text_detection, text_recognition;
@@ -160,6 +155,9 @@ int main(int argc, char *argv[]) {
         }
         std::cout << std::endl;
 
+        cv::Size graphSize{static_cast<int>(image.cols / 4), 60};
+        Presenter presenter(FLAGS_u, image.rows - graphSize.height - 10, graphSize);
+
         while (!image.empty()) {
             cv::Mat demo_image = image.clone();
             cv::Size orig_image_size = image.size();
@@ -222,11 +220,15 @@ int main(int argc, char *argv[]) {
                     if (output_shape[2] != kAlphabet.length())
                         throw std::runtime_error("The text recognition model does not correspond to alphabet.");
 
-                    float *ouput_data_pointer = blobs.begin()->second->buffer().as<PrecisionTrait<Precision::FP32>::value_type *>();
-                    std::vector<float> output_data(ouput_data_pointer, ouput_data_pointer + output_shape[0] * output_shape[2]);
+                    float *output_data_pointer = blobs.begin()->second->buffer().as<PrecisionTrait<Precision::FP32>::value_type *>();
+                    std::vector<float> output_data(output_data_pointer, output_data_pointer + output_shape[0] * output_shape[2]);
 
                     std::chrono::steady_clock::time_point begin = std::chrono::steady_clock::now();
-                    res = CTCGreedyDecoder(output_data, kAlphabet, kPadSymbol, &conf);
+                    if (decoder_bandwidth == 0) {
+                        res = CTCGreedyDecoder(output_data, kAlphabet, kPadSymbol, &conf);
+                    } else {
+                        res = CTCBeamSearchDecoder(output_data, kAlphabet, kPadSymbol, &conf, decoder_bandwidth);
+                    }
                     std::chrono::steady_clock::time_point end = std::chrono::steady_clock::now();
                     text_recognition_postproc_time += std::chrono::duration_cast<std::chrono::microseconds>(end - begin).count();
 
@@ -272,12 +274,15 @@ int main(int argc, char *argv[]) {
             }
             int fps = static_cast<int>(1000 / avg_time);
 
+            presenter.drawGraphs(demo_image);
+
             if (!FLAGS_no_show) {
                 cv::putText(demo_image, "fps: " + std::to_string(fps) + " found: " + std::to_string(num_found),
                             cv::Point(50, 50), cv::FONT_HERSHEY_COMPLEX, 1, cv::Scalar(0, 0, 255), 1);
                 cv::imshow("Press ESC key to exit", demo_image);
-                char k = static_cast<char>(cv::waitKey(wait_time));
+                char k = cv::waitKey(wait_time);
                 if (k == 27) break;
+                presenter.handleKey(k);
             }
 
             grabber->GrabNextImage(&image);
@@ -384,7 +389,7 @@ cv::Mat cropImage(const cv::Mat &image, const std::vector<cv::Point2f> &points,
     return crop;
 }
 
-void setLabel(cv::Mat& im, const std::string label, const cv::Point & p) {
+void setLabel(cv::Mat& im, const std::string& label, const cv::Point & p) {
     int fontface = cv::FONT_HERSHEY_SIMPLEX;
     double scale = 0.7;
     int thickness = 1;
diff --git a/demos/text_detection_demo/src/cnn.cpp b/demos/text_detection_demo/src/cnn.cpp
index 08f4a409f55..1a4d610ae21 100644
--- a/demos/text_detection_demo/src/cnn.cpp
+++ b/demos/text_detection_demo/src/cnn.cpp
@@ -15,18 +15,14 @@ void Cnn::Init(const std::string &model_path, Core & ie, const std::string & dev
     // ---------------------------------------------------------------------------------------------------
 
     // --------------------------- 1. Reading network ----------------------------------------------------
-    CNNNetReader network_reader;
-    network_reader.ReadNetwork(model_path);
-    network_reader.ReadWeights(fileNameNoExt(model_path) + ".bin");
-    network_reader.getNetwork().setBatchSize(1);
+    auto network = ie.ReadNetwork(model_path);
+    network.setBatchSize(1);
 
     model_path_ = model_path;
 
-    CNNNetwork network = network_reader.getNetwork();
-
     // --------------------------- Changing input shape if it is needed ----------------------------------
     if (new_input_resolution != cv::Size()) {
-        InputsDataMap inputInfo(network_reader.getNetwork().getInputsInfo());
+        InputsDataMap inputInfo(network.getInputsInfo());
         if (inputInfo.size() != 1) {
             THROW_IE_EXCEPTION << "The network should have only one input";
         }
diff --git a/demos/text_detection_demo/src/text_detection.cpp b/demos/text_detection_demo/src/text_detection.cpp
index a415c096720..eab8501765e 100644
--- a/demos/text_detection_demo/src/text_detection.cpp
+++ b/demos/text_detection_demo/src/text_detection.cpp
@@ -159,17 +159,17 @@ cv::Mat decodeImageByJoin(const std::vector<float> &cls_data, const std::vector<
         link_mask[i] = link_data[i] >= link_conf_threshold;
     }
 
-    int neighbours = link_data_shape[3];
+    size_t neighbours = size_t(link_data_shape[3]);
     for (const auto &point : points) {
-        int neighbour = 0;
+        size_t neighbour = 0;
         for (int ny = point.y - 1; ny <= point.y + 1; ny++) {
             for (int nx = point.x - 1; nx <= point.x + 1; nx++) {
                 if (nx == point.x && ny == point.y)
                     continue;
                 if (nx >= 0 && nx < w && ny >= 0 && ny < h) {
-                    uchar pixel_value = pixel_mask[static_cast<size_t>(ny * w + nx)];
-                    uchar link_value = link_mask[static_cast<size_t>(point.y * w * neighbours +
-                                                                     point.x * neighbours + neighbour)];
+                    uchar pixel_value = pixel_mask[size_t(ny) * size_t(w) + size_t(nx)];
+                    uchar link_value = link_mask[
+                        (size_t(point.y) * size_t(w) + size_t(point.x)) * neighbours + neighbour];
                     if (pixel_value && link_value) {
                         join(point.x + point.y * w, nx + ny * w, &group_mask);
                     }
diff --git a/demos/text_detection_demo/src/text_recognition.cpp b/demos/text_detection_demo/src/text_recognition.cpp
index c22d2538aa0..1c57ca3c43e 100644
--- a/demos/text_detection_demo/src/text_recognition.cpp
+++ b/demos/text_detection_demo/src/text_recognition.cpp
@@ -10,9 +10,10 @@
 #include <vector>
 #include <limits>
 #include <stdexcept>
+#include <numeric>
 
 namespace  {
-    void softmax(const std::vector<float>::const_iterator& begin, const std::vector<float>::const_iterator& end, int *argmax, float *prob) {
+    void softmax_and_choose(const std::vector<float>::const_iterator& begin, const std::vector<float>::const_iterator& end, int *argmax, float *prob) {
         auto max_element = std::max_element(begin, end);
         *argmax = static_cast<int>(std::distance(begin, max_element));
         float max_val = *max_element;
@@ -25,6 +26,27 @@ namespace  {
         }
         *prob = 1.0f / static_cast<float>(sum);
     }
+
+    std::vector<float> softmax(const std::vector<float>::const_iterator& begin, const std::vector<float>::const_iterator& end) {
+        std::vector<float> prob(end - begin, 0.f);  // one probability per input logit
+        const float max_val = prob.empty() ? 0.f : *std::max_element(begin, end);  // shift so std::exp cannot overflow
+        std::transform(begin, end, prob.begin(), [max_val](float x) { return std::exp(x - max_val); });
+        const float sum = std::accumulate(prob.begin(), prob.end(), 0.0f);
+        for (float& p : prob)
+            p /= sum;
+        return prob;
+    }
+
+    struct BeamElement {
+        std::vector<int> sentence;   //!< Class indices (into the alphabet) of the chars decoded so far
+        float prob_blank;            //!< The probability that the last char in CTC sequence
+                                     //!< for the beam element is the special blank char
+        float prob_not_blank;        //!< The probability that the last char in CTC sequence
+                                     //!< for the beam element is NOT the special blank char
+
+        float prob() const {         //!< Total probability of the beam element (both cases summed)
+            return prob_blank + prob_not_blank;
+        }
+    };
 }  // namespace
 
 std::string CTCGreedyDecoder(const std::vector<float> &data, const std::string& alphabet, char pad_symbol, double *conf) {
@@ -37,7 +59,7 @@ std::string CTCGreedyDecoder(const std::vector<float> &data, const std::string&
       int argmax;
       float prob;
 
-      softmax(it, it + num_classes, &argmax, &prob);
+      softmax_and_choose(it, it + num_classes, &argmax, &prob);
 
       (*conf) *= prob;
 
@@ -53,3 +75,80 @@ std::string CTCGreedyDecoder(const std::vector<float> &data, const std::string&
     }
     return res;
 }
+
+// CTC beam search decoder: returns the most probable string and stores its probability in *conf.
+// data holds rows of alphabet.length() logits whose last class is the CTC blank; pad_symbol is unused.
+std::string CTCBeamSearchDecoder(const std::vector<float> &data, const std::string& alphabet, char pad_symbol, double *conf, int bandwidth) {
+    const int num_classes = alphabet.length();
+    if (bandwidth <= 0)  // an empty beam would leave no hypothesis to return
+        throw std::invalid_argument("Bandwidth for CTC beam search decoder must be positive");
+    if (num_classes <= 0 || data.size() % static_cast<size_t>(num_classes) != 0)  // keeps the row iterator in range
+        throw std::invalid_argument("CTC decoder input size must be a multiple of the alphabet length");
+
+    std::vector<BeamElement> curr;
+    std::vector<BeamElement> last;
+    last.push_back(BeamElement{std::vector<int>(), 1.f, 0.f});  // start from the empty prefix
+
+    for (std::vector<float>::const_iterator it = data.begin(); it != data.end(); it += num_classes) {
+        curr.clear();
+        std::vector<float> prob = softmax(it, it + num_classes);
+
+        for (const auto& candidate : last) {
+            float prob_not_blank = 0.f;
+            const std::vector<int>& candidate_sentence = candidate.sentence;
+            if (!candidate_sentence.empty()) {
+                // Repeating the last char without a blank in between keeps the prefix unchanged
+                prob_not_blank = candidate.prob_not_blank * prob[candidate_sentence.back()];
+            }
+            float prob_blank = candidate.prob() * prob[num_classes - 1];
+
+            auto check_res = std::find_if(curr.begin(), curr.end(), [&candidate_sentence](const BeamElement& n) {
+                return n.sentence == candidate_sentence;
+            });
+            if (check_res == std::end(curr)) {
+                curr.push_back(BeamElement{candidate.sentence, prob_blank, prob_not_blank});
+            } else {
+                check_res->prob_not_blank += prob_not_blank;
+                if (check_res->prob_blank != 0.f) {
+                    throw std::logic_error("Probability that the last char in CTC-sequence is the special blank char must be zero here");
+                }
+                check_res->prob_blank = prob_blank;
+            }
+
+            for (int i = 0; i < num_classes - 1; i++) {
+                auto extend = candidate_sentence;
+                extend.push_back(i);
+
+                // A repeated char extends the prefix only if a blank separated the two occurrences
+                if (!candidate_sentence.empty() && candidate_sentence.back() == i) {
+                    prob_not_blank = prob[i] * candidate.prob_blank;
+                } else {
+                    prob_not_blank = prob[i] * candidate.prob();
+                }
+                auto extended = std::find_if(curr.begin(), curr.end(), [&extend](const BeamElement &n) {
+                    return n.sentence == extend;
+                });
+                if (extended == std::end(curr)) {
+                    curr.push_back(BeamElement{extend, 0.f, prob_not_blank});
+                } else {
+                    extended->prob_not_blank += prob_not_blank;
+                }
+            }
+        }
+
+        // Keep only the `bandwidth` most probable prefixes for the next step
+        std::sort(curr.begin(), curr.end(), [](const BeamElement &a, const BeamElement &b) -> bool {
+            return a.prob() > b.prob();
+        });
+        const int num_to_copy = std::min(bandwidth, static_cast<int>(curr.size()));
+        last.assign(curr.begin(), curr.begin() + num_to_copy);
+    }
+
+    *conf = last[0].prob();
+    std::string res;
+    for (const auto& idx : last[0].sentence) {
+        res += alphabet[idx];
+    }
+
+    return res;
+}
diff --git a/demos/text_detection_demo/text_detection_demo.hpp b/demos/text_detection_demo/text_detection_demo.hpp
index 717f077db33..a01589015d6 100644
--- a/demos/text_detection_demo/text_detection_demo.hpp
+++ b/demos/text_detection_demo/text_detection_demo.hpp
@@ -9,149 +9,63 @@
 #include <vector>
 #include <gflags/gflags.h>
 
-/// @brief Message for help argument
 static const char help_message[] = "Print a usage message.";
-
-/// @brief Message for input path argument
 static const char input_message[] = "Required. Path to an image or video file, to a text file with paths to images, "
                                     "or to a webcamera device node (for example, /dev/video0).";
-
-/// @brief Message for text detection model argument
 static const char text_detection_model_message[] = "Required. Path to the Text Detection model (.xml) file.";
-
-/// @brief Message for text recognition model argument
 static const char text_recognition_model_message[] = "Required. Path to the Text Recognition model (.xml) file.";
-
-/// @brief Message for text recognition model symbols set argument
 static const char text_recognition_model_symbols_set_message[] = "Optional. Symbol set for the Text Recognition model.";
-
-/// @brief Message for central image crop argument
 static const char text_central_image_crop_message[] = "Optional. If it is set, then in case of absence of the Text Detector, "
-                                                      "the Text Reconition model takes a central image crop as an input, but not full frame.";
-
-/// @brief Message for input image width for text detection model argument
+                                                      "the Text Recognition model takes a central image crop as an input, but not full frame.";
 static const char image_width_for_text_detection_model_message[] = "Optional. Input image width for Text Detection model.";
-
-/// @brief Message for input image height for text detection model argument
 static const char image_height_for_text_detection_model_message[] = "Optional. Input image height for Text Detection model.";
-
-/// @brief Message for text recognition threshold argument
 static const char text_recognition_threshold_message[] = "Optional. Specify a recognition confidence threshold. Text detection candidates with "
                                                          "text recognition confidence below specified threshold are rejected.";
-
-/// @brief Message for pixel classification threshold argument
 static const char pixel_classification_threshold_message[] = "Optional. Specify a confidence threshold for pixel classification. "
                                                              "Pixels with classification confidence below specified threshold are rejected.";
-
-/// @brief Message for pixel linkage threshold argument
 static const char pixel_linkage_threshold_message[] = "Optional. Specify a confidence threshold for pixel linkage. "
                                                       "Pixels with linkage confidence below specified threshold are not linked.";
-
-/// @brief Message for max rectangles number argument
 static const char text_max_rectangles_number_message[] = "Optional. Maximum number of rectangles to recognize. "
                                                          "If it is negative, number of rectangles to recognize is not limited.";
-
-/// @brief Message for text detection target device argument
 static const char text_detection_target_device_message[] = "Optional. Specify the target device for the Text Detection model to infer on "
                                                            "(the list of available devices is shown below). "
                                                            "The demo will look for a suitable plugin for a specified device. By default, it is CPU.";
-
-/// @brief Message for text recognition target device argument
 static const char text_recognition_target_device_message[] = "Optional. Specify the target device for the Text Recognition model to infer on "
                                                              "(the list of available devices is shown below). "
                                                              "The demo will look for a suitable plugin for a specified device. By default, it is CPU.";
-
-/// @brief Message for user library argument
 static const char custom_cpu_library_message[] = "Optional. Absolute path to a shared library with the CPU kernels implementation "
                                                  "for custom layers.";
-
-/// @brief Message for user library argument
 static const char custom_gpu_library_message[] = "Optional. Absolute path to the GPU kernels implementation for custom layers.";
-
-/// @brief Message for user no_show argument
 static const char no_show_message[] = "Optional. If it is true, then detected text will not be shown on image frame. By default, it is false.";
-
-/// @brief Message raw output flag
 static const char raw_output_message[] = "Optional. Output Inference results as raw values.";
-
-/// @brief Message for input data type argument
 static const char input_data_type_message[] = "Required. Input data type: \"image\" (for a single image), "
                                               "\"list\" (for a text file where images paths are listed), "
                                               "\"video\" (for a saved video), "
                                               "\"webcam\" (for a webcamera device). By default, it is \"image\".";
+static const char utilization_monitors_message[] = "Optional. List of monitors to show initially.";
+static const char decoder_bandwidth_message[] = "Optional. Bandwidth for CTC beam search decoder. Default value is 0, in this case CTC greedy decoder will be used.";
 
-/// @brief Define flag for showing help message <br>
 DEFINE_bool(h, false, help_message);
-
-/// @brief Define parameter for setting input path <br>
-/// It is a required parameter
 DEFINE_string(i, "", input_message);
-
-/// @brief Define parameter for text detection model file <br>
-/// It is a required parameter
 DEFINE_string(m_td, "", text_detection_model_message);
-
-/// @brief Define parameter for text recognition model file <br>
-/// It is a required parameter
 DEFINE_string(m_tr, "", text_recognition_model_message);
-
-/// @brief Define parameter for text recognition model symbols set <br>
-/// It is a optional parameter
 DEFINE_string(m_tr_ss, "0123456789abcdefghijklmnopqrstuvwxyz", text_recognition_model_symbols_set_message);
-
-/// @brief Define parameter for central image crop. <br>
-/// It is a optional parameter
 DEFINE_bool(cc, false, text_central_image_crop_message);
-
-/// @brief Define parameter for input image width for text detection model <br>
-/// It is a optional parameter
 DEFINE_int32(w_td, 1280, image_width_for_text_detection_model_message);
-
-/// @brief Define parameter for input image height for text detection model <br>
-/// It is a optional parameter
 DEFINE_int32(h_td, 768, image_height_for_text_detection_model_message);
-
-/// @brief Define parameter for text recognition threshold <br>
-/// It is a optional parameter
 DEFINE_double(thr, 0.2, text_recognition_threshold_message);
-
-/// @brief Define parameter for pixel classification threshold <br>
-/// It is a optional parameter
 DEFINE_double(cls_pixel_thr, 0.8, pixel_classification_threshold_message);
-
-/// @brief Define parameter for pixel linking threshold <br>
-/// It is a optional parameter
 DEFINE_double(link_pixel_thr, 0.8, pixel_linkage_threshold_message);
-
-/// @brief Define parameter for maximum number of rectangles to recognize. If it is negative number of rectangles to recognize is not limited. <br>
-/// It is a optional parameter
 DEFINE_int32(max_rect_num, -1, text_max_rectangles_number_message);
-
-/// @brief Define parameter for input data type ("image", "list", "video", "webcam"). <br>
-/// It is a required parameter
 DEFINE_string(dt, "", input_data_type_message);
-
-/// @brief Define the target device for text detection model to infer on <br>
 DEFINE_string(d_td, "CPU", text_detection_target_device_message);
-
-/// @brief Define the target device for text recognition model to infer on <br>
 DEFINE_string(d_tr, "CPU", text_recognition_target_device_message);
-
-/// @brief Define parameter for asolute path to a shared library with the CPU kernels implementation for custom layers. <br>
-/// It is a optional parameter
 DEFINE_string(l, "", custom_cpu_library_message);
-
-/// @brief Define parameter for asolute path to the GPU kernels implementation for custom layers. <br>
-/// It is a optional parameter
 DEFINE_string(c, "", custom_gpu_library_message);
-
-/// @brief Define a flag to not show detected text on image frame. By default, it is false. <br>
-/// It is an optional parameter
 DEFINE_bool(no_show, false, no_show_message);
-
-/// @brief Flag to output raw pipeline results<br>
-/// It is an optional parameter
 DEFINE_bool(r, false, raw_output_message);
+DEFINE_string(u, "", utilization_monitors_message);
+DEFINE_uint32(b, 0, decoder_bandwidth_message);
 
 /**
 * @brief This function shows a help message
@@ -180,4 +94,6 @@ static void showUsage() {
     std::cout << "    -c \"<absolute_path>\"         " << custom_gpu_library_message << std::endl;
     std::cout << "    -no_show                     " << no_show_message << std::endl;
     std::cout << "    -r                           " << raw_output_message << std::endl;
+    std::cout << "    -u                           " << utilization_monitors_message << std::endl;
+    std::cout << "    -b                           " << decoder_bandwidth_message << std::endl;
 }
diff --git a/models/intel/action-recognition-0001-decoder/description/action-recognition-0001-decoder.md b/models/intel/action-recognition-0001-decoder/description/action-recognition-0001-decoder.md
index 4c7e72eb7af..db4599d035b 100644
--- a/models/intel/action-recognition-0001-decoder/description/action-recognition-0001-decoder.md
+++ b/models/intel/action-recognition-0001-decoder/description/action-recognition-0001-decoder.md
@@ -2,7 +2,7 @@
 
 ## Use Case and High-Level Description
 
-This is an general-purpose action recognition model for Kinetics-400 dataset. The model uses Video Transformer approach with ResNet34 encoder.
+This is a general-purpose action recognition model for Kinetics-400 dataset. The model uses Video Transformer approach with ResNet34 encoder.
 Please refer to the [kinetics](https://deepmind.com/research/open-source/open-source-datasets/kinetics/) dataset specification to see list of action that are recognised by this model.
 
 This model is only decoder part of the whole pipeline. It accepts stack of frame embeddings, computed by action-recognition-0001-encoder, and produces prediction on input video. Video frames should be sampled to cover ~1 second fragment (i.e. skip every second frame in 30 fps video).
diff --git a/models/intel/action-recognition-0001-decoder/model.yml b/models/intel/action-recognition-0001-decoder/model.yml
index 0ab5e229a65..7c39000f01d 100644
--- a/models/intel/action-recognition-0001-decoder/model.yml
+++ b/models/intel/action-recognition-0001-decoder/model.yml
@@ -13,32 +13,25 @@
 # limitations under the License.
 
 description: >-
-  This is an general-purpose action recognition model for Kinetics-400 dataset.
-  The model uses Video Transformer approach with ResNet34 encoder. Please refer
-  to the kinetics <https://deepmind.com/research/open-source/open-source-datasets/kinetics/>
-  dataset specification to see list of action that are recognised by this model.
-
-  This model is only decoder part of the whole pipeline. It accepts stack of frame
-  embeddings, computed by action-recognition-0001-encoder, and produces prediction
-  on input video. Video frames should be sampled to cover ~1 second fragment (i.e.
-  skip every second frame in 30 fps video).
+  General-purpose action recognition model for Kinetics-400 dataset based on Video
+  Transformer Network approach. Decoder part.
 task_type: action_recognition
 files:
   - name: FP32/action-recognition-0001-decoder.xml
-    size: 104114
-    sha256: 8fa144ca38792c7ea040fa0903156e0ddb48ad55e7691b3c901e02d8562ac8a2
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/action-recognition-0001-decoder/FP32/action-recognition-0001-decoder.xml
+    size: 117064
+    sha256: 662329658703c2e69659be688f48d900fe56adf7a467d1f7511e18443e2ef87a
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/action-recognition-0001-decoder/FP32/action-recognition-0001-decoder.xml
   - name: FP32/action-recognition-0001-decoder.bin
-    size: 30238472
-    sha256: 493bbfe6ae4b362c01dee751e1bcd3f13b24ec7c24d6f26f5034fc0d268b8c65
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/action-recognition-0001-decoder/FP32/action-recognition-0001-decoder.bin
+    size: 30238776
+    sha256: 94b20a3d531c2f72fa4230aaed22ed9140f8923ed60907cbf1a0a48147d7663d
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/action-recognition-0001-decoder/FP32/action-recognition-0001-decoder.bin
   - name: FP16/action-recognition-0001-decoder.xml
-    size: 104078
-    sha256: 420a1353ccc74fe4d87bfb3d3b7f7a9aad88fb80aea8a45d6572a1538a6db409
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/action-recognition-0001-decoder/FP16/action-recognition-0001-decoder.xml
+    size: 117024
+    sha256: cee9b6fd416bfab880fe1e782d1705ee799d60b7ef84615a7c26c80d92efef43
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/action-recognition-0001-decoder/FP16/action-recognition-0001-decoder.xml
   - name: FP16/action-recognition-0001-decoder.bin
-    size: 15119336
-    sha256: 504fab429c1f31864fbe02b8ec6ecc39d0f13947d2afbf65d7d4ce7d457330c0
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/action-recognition-0001-decoder/FP16/action-recognition-0001-decoder.bin
+    size: 15119512
+    sha256: 04108ac97f6815a1929b0cf3a6a5b539b28236ea7cf6bd4329011ca768257f23
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/action-recognition-0001-decoder/FP16/action-recognition-0001-decoder.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/action-recognition-0001-encoder/description/action-recognition-0001-encoder.md b/models/intel/action-recognition-0001-encoder/description/action-recognition-0001-encoder.md
index dca69465a2d..281461761f4 100644
--- a/models/intel/action-recognition-0001-encoder/description/action-recognition-0001-encoder.md
+++ b/models/intel/action-recognition-0001-encoder/description/action-recognition-0001-encoder.md
@@ -2,7 +2,7 @@
 
 ## Use Case and High-Level Description
 
-This is an general-purpose action recognition model for Kinetics-400 dataset. The model uses Video Transformer approach with ResNet34 encoder.
+This is a general-purpose action recognition model for the Kinetics-400 dataset. The model uses the Video Transformer approach with a ResNet34 encoder.
 Please refer to the [kinetics](https://deepmind.com/research/open-source/open-source-datasets/kinetics/) dataset specification to see list of action that are recognised by this model.
 
 This model is only encoder part of the whole pipeline. It accepts video frame and produces embedding.
diff --git a/models/intel/action-recognition-0001-encoder/model.yml b/models/intel/action-recognition-0001-encoder/model.yml
index e9cd1387dd4..43ed1f8e05a 100644
--- a/models/intel/action-recognition-0001-encoder/model.yml
+++ b/models/intel/action-recognition-0001-encoder/model.yml
@@ -13,32 +13,25 @@
 # limitations under the License.
 
 description: >-
-  This is an general-purpose action recognition model for Kinetics-400 dataset.
-  The model uses Video Transformer approach with ResNet34 encoder. Please refer
-  to the kinetics <https://deepmind.com/research/open-source/open-source-datasets/kinetics/>
-  dataset specification to see list of action that are recognised by this model.
-
-  This model is only encoder part of the whole pipeline. It accepts video frame
-  and produces embedding. Use action-recognition-0001-decoder to produce prediction
-  from embeddings of 16 frames. Video frames should be sampled to cover ~1 second
-  fragment (i.e. skip every second frame in 30 fps video).
+  General-purpose action recognition model for Kinetics-400 dataset based on Video
+  Transformer Network approach. Encoder part
 task_type: action_recognition
 files:
   - name: FP32/action-recognition-0001-encoder.xml
-    size: 49054
-    sha256: 7c04f243aecb06427720aa5df772fe31c3adcd33014a684913369cfabc0f8c69
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/action-recognition-0001-encoder/FP32/action-recognition-0001-encoder.xml
+    size: 98459
+    sha256: 27a2f6b6a53f5c860c729bb532fc50f0d8e84e180f6e99a97c1de1c292e5e728
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/action-recognition-0001-encoder/FP32/action-recognition-0001-encoder.xml
   - name: FP32/action-recognition-0001-encoder.bin
     size: 85104664
     sha256: c33e24b3f74918104eeafc106ee7f0b56804f03b87098c14ad66af6386cdb648
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/action-recognition-0001-encoder/FP32/action-recognition-0001-encoder.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/action-recognition-0001-encoder/FP32/action-recognition-0001-encoder.bin
   - name: FP16/action-recognition-0001-encoder.xml
-    size: 49014
-    sha256: d8e78c551b578028a8f3da671c4283622e367385d6c7eab6d3c000cf631e5997
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/action-recognition-0001-encoder/FP16/action-recognition-0001-encoder.xml
+    size: 98419
+    sha256: 901c3ab3b9134db90c1ef2fa4b523fa4ddc795de9fbeb250ddefce466ea83e39
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/action-recognition-0001-encoder/FP16/action-recognition-0001-encoder.xml
   - name: FP16/action-recognition-0001-encoder.bin
     size: 42552332
     sha256: 57d374b873dc87c72e5baab53245d59f1b866f6e2c3e670c923537f45018782c
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/action-recognition-0001-encoder/FP16/action-recognition-0001-encoder.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/action-recognition-0001-encoder/FP16/action-recognition-0001-encoder.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/age-gender-recognition-retail-0013/model.yml b/models/intel/age-gender-recognition-retail-0013/model.yml
index 815ef3da6cb..1a543a00bbc 100644
--- a/models/intel/age-gender-recognition-retail-0013/model.yml
+++ b/models/intel/age-gender-recognition-retail-0013/model.yml
@@ -13,26 +13,32 @@
 # limitations under the License.
 
 description: >-
-  Fully convolutional network for simultaneous Age/Gender recognition. The network
-  is able to recognize age of people in [18, 75] years old range, it is not applicable
-  for children since their faces were not in the training set.
+  Age & gender classification. Used in Audience Analytics.
 task_type: object_attributes
 files:
   - name: FP32/age-gender-recognition-retail-0013.xml
-    size: 14883
-    sha256: 9accd7693ca200340b9651e333517bbceee68c3b11c1d3be0413eb667909aea5
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/age-gender-recognition-retail-0013/FP32/age-gender-recognition-retail-0013.xml
+    size: 30006
+    sha256: ca2c4826b9370038643d97a434bb9621adea4baf4279e5b9c3a83002456fd755
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/age-gender-recognition-retail-0013/FP32/age-gender-recognition-retail-0013.xml
   - name: FP32/age-gender-recognition-retail-0013.bin
     size: 8552076
     sha256: 4dab79cfedebd628f3327367a91c9736a32fbf9cc733cbbf1629d16910d4ace7
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/age-gender-recognition-retail-0013/FP32/age-gender-recognition-retail-0013.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/age-gender-recognition-retail-0013/FP32/age-gender-recognition-retail-0013.bin
   - name: FP16/age-gender-recognition-retail-0013.xml
-    size: 14873
-    sha256: 6d5c05b968c1b68f1bbf3ee9b36dc53f01dee1b396936864dd7265fc074ea357
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/age-gender-recognition-retail-0013/FP16/age-gender-recognition-retail-0013.xml
+    size: 29996
+    sha256: a375a5d8617ff1913dfc1210f5bb07493d72293c0efa87c1abcdfe181ae8a2b0
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/age-gender-recognition-retail-0013/FP16/age-gender-recognition-retail-0013.xml
   - name: FP16/age-gender-recognition-retail-0013.bin
     size: 4276038
     sha256: 401101e0a01b3d68add39deae833bcf9f54238d37dd13e3fb1534aa8fbe4719d
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/age-gender-recognition-retail-0013/FP16/age-gender-recognition-retail-0013.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/age-gender-recognition-retail-0013/FP16/age-gender-recognition-retail-0013.bin
+  - name: FP32-INT8/age-gender-recognition-retail-0013.xml
+    size: 64387
+    sha256: 930b5e2ef06d890a79e91f16ecbe54ce08abcb6923cfb56afa464750588d7a21
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/age-gender-recognition-retail-0013/FP32-INT8/age-gender-recognition-retail-0013.xml
+  - name: FP32-INT8/age-gender-recognition-retail-0013.bin
+    size: 8565952
+    sha256: 0efcef2c78fa5208d85d2eb5fc69955c6d97a2ba2948c67a75b0dcb3b74da41e
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/age-gender-recognition-retail-0013/FP32-INT8/age-gender-recognition-retail-0013.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/asl-recognition-0004/description/asl-recognition-0004.jpg b/models/intel/asl-recognition-0004/description/asl-recognition-0004.jpg
new file mode 100644
index 00000000000..aa04fe4fe14
Binary files /dev/null and b/models/intel/asl-recognition-0004/description/asl-recognition-0004.jpg differ
diff --git a/models/intel/asl-recognition-0004/description/asl-recognition-0004.md b/models/intel/asl-recognition-0004/description/asl-recognition-0004.md
new file mode 100644
index 00000000000..e94b097b100
--- /dev/null
+++ b/models/intel/asl-recognition-0004/description/asl-recognition-0004.md
@@ -0,0 +1,43 @@
+# asl-recognition-0004
+
+## Use Case and High-Level Description
+
+A human gesture recognition model for the American Sign Language (ASL) recognition scenario 
+(word-level recognition). The model uses an S3D framework with MobileNet V3 backbone. Please refer 
+to the [MS-ASL-100\*](https://www.microsoft.com/en-us/research/project/ms-asl/) dataset specification 
+to see the list of gestures that are recognized by this model.
+
+The model accepts a stack of frames sampled at a constant frame rate (15 FPS) and produces a prediction
+for the input clip.
+
+## Example
+
+![](./asl-recognition-0004.jpg)
+
+## Specification
+
+| Metric                          | Value                                     |
+|---------------------------------|-------------------------------------------|
+| Top-1 accuracy (MS-ASL-100\*)   | 0.847                                     |
+| GFlops                          | 6.660                                     |
+| MParams                         | 4.133                                     |
+| Source framework                | PyTorch\*                                 |
+
+
+## Performance
+
+## Inputs
+
+Name: `input`, shape: [1x3x16x224x224]. An input image sequence in the format [BxCxTxHxW], where:
+ - B - batch size
+ - C - number of channels
+ - T - duration of input clip
+ - H - image height
+ - W - image width
+
+## Outputs
+
+The model outputs a tensor with the shape [Bx100]; each row is a vector of logits over the ASL gesture classes.
+
+## Legal Information
+[\*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/driver-action-recognition-adas-0002-decoder/model.yml b/models/intel/driver-action-recognition-adas-0002-decoder/model.yml
index 45e0455b150..e9d9b11b4db 100644
--- a/models/intel/driver-action-recognition-adas-0002-decoder/model.yml
+++ b/models/intel/driver-action-recognition-adas-0002-decoder/model.yml
@@ -13,32 +13,24 @@
 # limitations under the License.
 
 description: >-
-  This is an action recognition model for the driver monitoring use case. The
-  model uses Video Transformer approach with MobileNetv2 encoder. It is able to
-  recognize the following actions: drinking, doing hair or making up, operating
-  the radio, reaching behind, safe driving, talking on the phone, texting.
-
-  This model is only decoder part of the whole pipeline. It accepts stack of frame
-  embeddings, computed by driver-action-recognition-adas-0002-encoder, and produces
-  prediction on input video. Video frames should be sampled to cover ~1 second
-  fragment (i.e. skip every second frame in 30 fps video).
+  Video Transformer Network for driver action recognition. Decoder part
 task_type: action_recognition
 files:
   - name: FP32/driver-action-recognition-adas-0002-decoder.xml
-    size: 106382
-    sha256: 164547853128a841c710c0e8eefc09bb333ced22bf24fd0cbaf81c979c07078d
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/driver-action-recognition-adas-0002-decoder/FP32/driver-action-recognition-adas-0002-decoder.xml
+    size: 120891
+    sha256: 94efc539bd05250ce27b5a9ed14463a415d8455fcf0b7bd13e027d1ebebd5ebf
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/driver-action-recognition-adas-0002-decoder/FP32/driver-action-recognition-adas-0002-decoder.xml
   - name: FP32/driver-action-recognition-adas-0002-decoder.bin
-    size: 29436112
-    sha256: 897732d7f276eabbe9f2ee8f510ce9772caad6e01a34527adef95b4fc9621058
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/driver-action-recognition-adas-0002-decoder/FP32/driver-action-recognition-adas-0002-decoder.bin
+    size: 29436428
+    sha256: 80deefba45d9b002c9780c9d9bcd2285b7be3f6b2ca319e2705898e725bd57c4
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/driver-action-recognition-adas-0002-decoder/FP32/driver-action-recognition-adas-0002-decoder.bin
   - name: FP16/driver-action-recognition-adas-0002-decoder.xml
-    size: 106346
-    sha256: a4987c75564e5ae2a7a7be34c151c02c58a065ddbc8b265cd5458da969b3666f
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/driver-action-recognition-adas-0002-decoder/FP16/driver-action-recognition-adas-0002-decoder.xml
+    size: 120851
+    sha256: 76d2fee0612c9bdb14cbbc3e8345e63cea4d09824bc6dee0b6393a82dd9effe2
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/driver-action-recognition-adas-0002-decoder/FP16/driver-action-recognition-adas-0002-decoder.xml
   - name: FP16/driver-action-recognition-adas-0002-decoder.bin
-    size: 14718142
-    sha256: 481760eaf84463bf8e4ca9034f1825d91658d79b946f796269dfb46e84461ce1
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/driver-action-recognition-adas-0002-decoder/FP16/driver-action-recognition-adas-0002-decoder.bin
+    size: 14718330
+    sha256: 1a6a163af7f634d8efff026855971445056fa6bff1da48e44cd35b1ea6c4cb43
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/driver-action-recognition-adas-0002-decoder/FP16/driver-action-recognition-adas-0002-decoder.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/driver-action-recognition-adas-0002-encoder/model.yml b/models/intel/driver-action-recognition-adas-0002-encoder/model.yml
index b4c18b29c84..0d5322fab97 100644
--- a/models/intel/driver-action-recognition-adas-0002-encoder/model.yml
+++ b/models/intel/driver-action-recognition-adas-0002-encoder/model.yml
@@ -13,32 +13,24 @@
 # limitations under the License.
 
 description: >-
-  This is an action recognition model for the driver monitoring use case. The
-  model uses Video Transformer approach with MobileNetv2 encoder. It is able to
-  recognize the following actions: drinking, doing hair or making up, operating
-  the radio, reaching behind, safe driving, talking on the phone, texting.
-
-  This model is only encoder part of the whole pipeline. It accepts video frame
-  and produces embedding. Use driver-action-recognition-adas-0002-decoder to produce
-  prediction from embeddings of 16 frames. Video frames should be sampled to cover
-  ~1 second fragment (i.e. skip every second frame in 30 fps video).
+  Video Transformer Network for driver action recognition. Encoder part
 task_type: action_recognition
 files:
   - name: FP32/driver-action-recognition-adas-0002-encoder.xml
-    size: 56175
-    sha256: 3693b62b35b3646aaeeeb48712caae92c019a2e268b41094e83ef3f06d547d73
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/driver-action-recognition-adas-0002-encoder/FP32/driver-action-recognition-adas-0002-encoder.xml
+    size: 128346
+    sha256: 067e4067c883c6fcd5a432e3c6fb3b405f7b0d1b5857d64deaba3a70146ff2b4
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/driver-action-recognition-adas-0002-encoder/FP32/driver-action-recognition-adas-0002-encoder.xml
   - name: FP32/driver-action-recognition-adas-0002-encoder.bin
     size: 11450776
     sha256: 12bf9bfebc74719d42bc2190bd00064ecf41b820df891040fcaa57f5eb4cffcb
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/driver-action-recognition-adas-0002-encoder/FP32/driver-action-recognition-adas-0002-encoder.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/driver-action-recognition-adas-0002-encoder/FP32/driver-action-recognition-adas-0002-encoder.bin
   - name: FP16/driver-action-recognition-adas-0002-encoder.xml
-    size: 56115
-    sha256: ee4da98beb4692d08f8a0e39a3e9eca7acb227825c162d1c1c23d28194f2fcd5
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/driver-action-recognition-adas-0002-encoder/FP16/driver-action-recognition-adas-0002-encoder.xml
+    size: 128282
+    sha256: 60694a0b9f7386590d6d395f4d0f4700c2193fb01ed0cfe7e3b8cb7a041d3652
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/driver-action-recognition-adas-0002-encoder/FP16/driver-action-recognition-adas-0002-encoder.xml
   - name: FP16/driver-action-recognition-adas-0002-encoder.bin
     size: 5725388
     sha256: 165b34437d1c73bf5adf356ddc18fb6bb11b4d99d8db0921dd25894d886535ef
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/driver-action-recognition-adas-0002-encoder/FP16/driver-action-recognition-adas-0002-encoder.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/driver-action-recognition-adas-0002-encoder/FP16/driver-action-recognition-adas-0002-encoder.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/emotions-recognition-retail-0003/description/emotions-recognition-retail-0003.md b/models/intel/emotions-recognition-retail-0003/description/emotions-recognition-retail-0003.md
index 4faec37e67b..c7c1ab91ddc 100644
--- a/models/intel/emotions-recognition-retail-0003/description/emotions-recognition-retail-0003.md
+++ b/models/intel/emotions-recognition-retail-0003/description/emotions-recognition-retail-0003.md
@@ -1,4 +1,4 @@
-# emotion-recognition-retail-0003
+# emotions-recognition-retail-0003
 
 ## Use Case and High-Level Description
 
diff --git a/models/intel/emotions-recognition-retail-0003/model.yml b/models/intel/emotions-recognition-retail-0003/model.yml
index e23b9c3b7ea..2ff97087be3 100644
--- a/models/intel/emotions-recognition-retail-0003/model.yml
+++ b/models/intel/emotions-recognition-retail-0003/model.yml
@@ -13,33 +13,32 @@
 # limitations under the License.
 
 description: >-
-  Fully convolutional network for recognition of five emotions ('neutral', 'happy',
-  'sad', 'surprise', 'anger').
+  Recognizes 5 emotions for a face. Targeted for Retail Audience Analytics.
 task_type: object_attributes
 files:
   - name: FP32/emotions-recognition-retail-0003.xml
-    size: 19918
-    sha256: 2410897e0990d55d85f20d88d966a3bbcfebd9656d5989df9ab580d24576e67f
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/emotions-recognition-retail-0003/FP32/emotions-recognition-retail-0003.xml
+    size: 37686
+    sha256: 702e374b7dc11b369c13c2f9c5fc638c617d19a9c625eba5fdac9d190fddba41
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/emotions-recognition-retail-0003/FP32/emotions-recognition-retail-0003.xml
   - name: FP32/emotions-recognition-retail-0003.bin
     size: 9930028
     sha256: bcb9b1a910fa3cd18a638bb1dbb0597c4ef7a080d1b83008c8e8c2c3c42b99dd
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/emotions-recognition-retail-0003/FP32/emotions-recognition-retail-0003.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/emotions-recognition-retail-0003/FP32/emotions-recognition-retail-0003.bin
   - name: FP16/emotions-recognition-retail-0003.xml
-    size: 19899
-    sha256: aab8a191bb7e5e62cd4212d74160a219496ea7308354bb823fd8388a06642123
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/emotions-recognition-retail-0003/FP16/emotions-recognition-retail-0003.xml
+    size: 37662
+    sha256: 76ba0e171289711e1d1b8418e2bdebf4940485c6c2e0a75d2572ef7dbcee762f
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/emotions-recognition-retail-0003/FP16/emotions-recognition-retail-0003.xml
   - name: FP16/emotions-recognition-retail-0003.bin
     size: 4965014
     sha256: e62fb4b819b3b3ad8aafcd308d4353db2f164a1a31d78de6cf5970837aeb6f7b
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/emotions-recognition-retail-0003/FP16/emotions-recognition-retail-0003.bin
-  - name: INT8/emotions-recognition-retail-0003.xml
-    size: 127471
-    sha256: c8e7e1aec2c483d93143053bc37e7a7edd9d5378e3d30ae64400a12c1ace4c83
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/emotions-recognition-retail-0003/INT8/emotions-recognition-retail-0003.xml
-  - name: INT8/emotions-recognition-retail-0003.bin
-    size: 9930028
-    sha256: 61203cb3b7318101637b444c12c9e050cb3447f682c44bc343e8926f9bfe6130
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/emotions-recognition-retail-0003/INT8/emotions-recognition-retail-0003.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/emotions-recognition-retail-0003/FP16/emotions-recognition-retail-0003.bin
+  - name: FP32-INT8/emotions-recognition-retail-0003.xml
+    size: 102858
+    sha256: 0b739388e9341f083df2d9b23506a13c234782d53e08f2e8051c0189e6e926ba
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/emotions-recognition-retail-0003/FP32-INT8/emotions-recognition-retail-0003.xml
+  - name: FP32-INT8/emotions-recognition-retail-0003.bin
+    size: 9947612
+    sha256: ff8ee9cee69cdc7043ec94522459770dfda865ff979a0c8beb73d7515f4a1df2
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/emotions-recognition-retail-0003/FP32-INT8/emotions-recognition-retail-0003.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/face-detection-adas-0001/model.yml b/models/intel/face-detection-adas-0001/model.yml
index 558ad139344..f641e646782 100644
--- a/models/intel/face-detection-adas-0001/model.yml
+++ b/models/intel/face-detection-adas-0001/model.yml
@@ -13,34 +13,32 @@
 # limitations under the License.
 
 description: >-
-  Face detector for driver monitoring and similar scenarios. The network features
-  a default MobileNet backbone that includes depth-wise convolutions to reduce
-  the amount of computation for the 3x3 convolution block.
+  Face Detection (MobileNet with reduced channels + SSD with weights sharing)
 task_type: detection
 files:
   - name: FP32/face-detection-adas-0001.xml
-    size: 89640
-    sha256: 4a567a086ce60e87868469161cb99e4a50d436a6eeb93c689a676a8bc268c8c6
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-adas-0001/FP32/face-detection-adas-0001.xml
+    size: 232998
+    sha256: 62b4bf7dead77e16a47428b541aa4f3c506cdf3c7e31a317aa75771dd907557c
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-adas-0001/FP32/face-detection-adas-0001.xml
   - name: FP32/face-detection-adas-0001.bin
-    size: 4211988
-    sha256: 0e8fd765cfac0dc369373d456cad17aab0b6c1534f6de33398f89946aa04c673
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-adas-0001/FP32/face-detection-adas-0001.bin
+    size: 4212072
+    sha256: 85a9334e031289692884e2aefbcb4ca401b003a3f25ff4dd0e669ba32f98cc0b
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-adas-0001/FP32/face-detection-adas-0001.bin
   - name: FP16/face-detection-adas-0001.xml
-    size: 89603
-    sha256: 00297f4b8a79d36142784dd3ee442ee5867c163b14fbe6b2c6e74cabc48a7e41
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-adas-0001/FP16/face-detection-adas-0001.xml
+    size: 232967
+    sha256: c0b9d34eba1fe6c76755fada4dc65634068eddf343a219b501ac71439348eac1
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-adas-0001/FP16/face-detection-adas-0001.xml
   - name: FP16/face-detection-adas-0001.bin
-    size: 2106000
-    sha256: e4d1ca072f26173321e580168d6b066eac5123cee136093fca492b2a0cf18cbc
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-adas-0001/FP16/face-detection-adas-0001.bin
-  - name: INT8/face-detection-adas-0001.xml
-    size: 3357740
-    sha256: 64b64a2180b3d9bf8619adc0fb173c045ead6bcf043aa56a9f0703c67bea77fa
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-adas-0001/INT8/face-detection-adas-0001.xml
-  - name: INT8/face-detection-adas-0001.bin
-    size: 4211988
-    sha256: 69650c48ce9ab68928397eb15f6fd8a41f0f9259098623c962720bbfaeb906a1
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-adas-0001/INT8/face-detection-adas-0001.bin
+    size: 2106088
+    sha256: df0f5799d801c6afb355d1c4771693c782efbb58d2eb2238982eac8fe84bc821
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-adas-0001/FP16/face-detection-adas-0001.bin
+  - name: FP32-INT8/face-detection-adas-0001.xml
+    size: 503962
+    sha256: 8959f287e3caf098948b2faee40d67e019c4b794948476fcdc8a28e58cb79125
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-adas-0001/FP32-INT8/face-detection-adas-0001.xml
+  - name: FP32-INT8/face-detection-adas-0001.bin
+    size: 4291532
+    sha256: d3ffb0da33361253d4027def5acddf104a6919c920582f084974a4f9d8529ffd
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-adas-0001/FP32-INT8/face-detection-adas-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/face-detection-adas-binary-0001/description/face-detection-adas-binary-0001.md b/models/intel/face-detection-adas-binary-0001/description/face-detection-adas-binary-0001.md
index b07e5034df8..253339d5ddf 100644
--- a/models/intel/face-detection-adas-binary-0001/description/face-detection-adas-binary-0001.md
+++ b/models/intel/face-detection-adas-binary-0001/description/face-detection-adas-binary-0001.md
@@ -23,7 +23,7 @@ are binary that can be implemented using effective binary XNOR+POPCOUNT approach
 | GFlops                          | 0.611                 |
 | GI1ops                          | 2.224                 |
 | MParams                         | 1.053                 |
-| Source framework                | Pytorch*              |
+| Source framework                | PyTorch*              |
 
 Average Precision (AP) is defined as an area under the
 [precision/recall](https://en.wikipedia.org/wiki/Precision_and_recall)
diff --git a/models/intel/face-detection-adas-binary-0001/model.yml b/models/intel/face-detection-adas-binary-0001/model.yml
index c5ac6d27b8d..12a5c01f4e0 100644
--- a/models/intel/face-detection-adas-binary-0001/model.yml
+++ b/models/intel/face-detection-adas-binary-0001/model.yml
@@ -13,19 +13,17 @@
 # limitations under the License.
 
 description: >-
-  Face detector for driver monitoring and similar scenarios. The network features
-  a pruned MobileNet backbone that includes depth-wise convolutions to reduce
-  the amount of computation for the 3x3 convolution block. Also some 1x1 convolutions
-  are binary that can be implemented using effective binary XNOR+POPCOUNT approach
+  Face Detection (MobileNet with reduced channels and binary convolution + SSD with
+  weights sharing)
 task_type: detection
 files:
-  - name: INT1/face-detection-adas-binary-0001.xml
+  - name: FP32-INT1/face-detection-adas-binary-0001.xml
     size: 116647
     sha256: fde8c465a5e3f3425fb567d31b9591ff8be589930c8488639f8feddf7f0301f2
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-adas-binary-0001/INT1/face-detection-adas-binary-0001.xml
-  - name: INT1/face-detection-adas-binary-0001.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-adas-binary-0001/FP32-INT1/face-detection-adas-binary-0001.xml
+  - name: FP32-INT1/face-detection-adas-binary-0001.bin
     size: 1840444
     sha256: 0e0742b61fb924e937a8974da8a2e15cc6afc15630afa3f220676ee7a3a99700
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-adas-binary-0001/INT1/face-detection-adas-binary-0001.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-adas-binary-0001/FP32-INT1/face-detection-adas-binary-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/face-detection-retail-0004/model.yml b/models/intel/face-detection-retail-0004/model.yml
index e2a818e40c5..ead8138e389 100644
--- a/models/intel/face-detection-retail-0004/model.yml
+++ b/models/intel/face-detection-retail-0004/model.yml
@@ -13,35 +13,33 @@
 # limitations under the License.
 
 description: >-
-  Face detector based on SqueezeNet light (half-channels) as a backbone with a
-  single SSD for indoor/outdoor scenes shot by a front-facing camera. The backbone
-  consists of fire modules to reduce the number of computations. The single SSD
-  head from 1/16 scale feature map has nine clustered prior boxes.
+  Face Detection (SqNet1.0modif+single scale) without BatchNormalization trained with
+  negatives.
 task_type: detection
 files:
   - name: FP32/face-detection-retail-0004.xml
-    size: 48102
-    sha256: 4c818c7db9672318f77d1b86e36858ed46880d2c04808348903854b467de9280
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-retail-0004/FP32/face-detection-retail-0004.xml
+    size: 101815
+    sha256: 81d31d708214bb4dd4dcef469fa18c611ad5c3f88447ba0986963696cfad8401
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-retail-0004/FP32/face-detection-retail-0004.xml
   - name: FP32/face-detection-retail-0004.bin
-    size: 2352892
-    sha256: a066b383f7b59055326f4facaef34c6669d8cb2cb817f98b8517fa6cebfb6f41
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-retail-0004/FP32/face-detection-retail-0004.bin
+    size: 2352984
+    sha256: 89349ce12dd21c5263fb302cd3ffd4b73c35ea12ed98aff863d03a2cf3a32464
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-retail-0004/FP32/face-detection-retail-0004.bin
   - name: FP16/face-detection-retail-0004.xml
-    size: 48060
-    sha256: 89ef76b87feed5663dc16d8975bee55fa59c6ac89dd6e58199ee42256ee4302e
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-retail-0004/FP16/face-detection-retail-0004.xml
+    size: 101773
+    sha256: 7e8e76df3b70ac24967f625f096b1a9c6f2474e099e94210b177be0a5175e521
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-retail-0004/FP16/face-detection-retail-0004.xml
   - name: FP16/face-detection-retail-0004.bin
-    size: 1176452
-    sha256: d20f133227037747343eb635c004679cb25f10acf5e823de72888f64d99ff77a
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-retail-0004/FP16/face-detection-retail-0004.bin
-  - name: INT8/face-detection-retail-0004.xml
-    size: 738371
-    sha256: e961e827f8535eea607691382204569214162fa844f3e5ba4380e6ca0e874098
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-retail-0004/INT8/face-detection-retail-0004.xml
-  - name: INT8/face-detection-retail-0004.bin
-    size: 2352892
-    sha256: ea68f90c1b55b70fe0c4e356b5469177a08981c4c71ad27532a1151ee7407430
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-retail-0004/INT8/face-detection-retail-0004.bin
+    size: 1176544
+    sha256: ab7def342edab22e69ba1ef4e971983ea4e0f337c43b0a49c7ef3a7627f6cf1a
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-retail-0004/FP16/face-detection-retail-0004.bin
+  - name: FP32-INT8/face-detection-retail-0004.xml
+    size: 231496
+    sha256: 4bac1bae22ab8f34c15a7504bd97ce3e57a71a5b63ec08435a1bdf180b38ab18
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-retail-0004/FP32-INT8/face-detection-retail-0004.xml
+  - name: FP32-INT8/face-detection-retail-0004.bin
+    size: 2372492
+    sha256: f696f0651da3cf3b07915356fa6f7332dde671ac51b26e3be8209df3d7f7e5e0
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-retail-0004/FP32-INT8/face-detection-retail-0004.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/face-detection-retail-0005/model.yml b/models/intel/face-detection-retail-0005/model.yml
index 523e986ce4b..eaa6461d12e 100644
--- a/models/intel/face-detection-retail-0005/model.yml
+++ b/models/intel/face-detection-retail-0005/model.yml
@@ -13,34 +13,32 @@
 # limitations under the License.
 
 description: >-
-  Face detector based on MobileNetV2 as a backbone with a single SSD head for
-  indoor/outdoor scenes shot by a front-facing camera. The single SSD head from
-  1/16 scale feature map has nine clustered prior boxes.
+  Face Detection based on MobileNetV2.
 task_type: detection
 files:
   - name: FP32/face-detection-retail-0005.xml
-    size: 64728
-    sha256: 1b3ebaee6ef1be7d053941de42e4cf9c06448008671a682c7cde0b00450b951a
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-retail-0005/FP32/face-detection-retail-0005.xml
+    size: 145896
+    sha256: 2a105498942571686ac856a6dcbe9ef33b54039d69bb861f5d3a98b58bbef016
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-retail-0005/FP32/face-detection-retail-0005.xml
   - name: FP32/face-detection-retail-0005.bin
-    size: 4083044
-    sha256: e5d2d463fe3b11fc99a77fe23d1daaa497309e73eca222be02bed99d0601115b
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-retail-0005/FP32/face-detection-retail-0005.bin
+    size: 4083132
+    sha256: bc174f03f2314bdbb7e1abfb5136ccb34507d8225f87b040c5a77493f1a6c307
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-retail-0005/FP32/face-detection-retail-0005.bin
   - name: FP16/face-detection-retail-0005.xml
-    size: 64647
-    sha256: 2a0e4c1197550019fe0a2e6b2b5fb4d686df5af5c7dd4f0e4d0edb932b76bc0b
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-retail-0005/FP16/face-detection-retail-0005.xml
+    size: 145815
+    sha256: 72732d512f311ab1fc96d76c5caaf253e84a944fb0899fc5bf3e4cdbebf2f827
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-retail-0005/FP16/face-detection-retail-0005.xml
   - name: FP16/face-detection-retail-0005.bin
-    size: 2041532
-    sha256: aee37d488af499cd89382ab5632449fce5985660c639217494ae9b64ede7d07e
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-retail-0005/FP16/face-detection-retail-0005.bin
-  - name: INT8/face-detection-retail-0005.xml
-    size: 1523176
-    sha256: fc761031609459a65816538405a94112e4d72b54fe9f5fc06d10f20041501411
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-retail-0005/INT8/face-detection-retail-0005.xml
-  - name: INT8/face-detection-retail-0005.bin
-    size: 4083060
-    sha256: 27dd6d53eb97198e9e94508802d47b02393c2deef7a2eebab72c1bdf05f26fb4
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-detection-retail-0005/INT8/face-detection-retail-0005.bin
+    size: 2041618
+    sha256: fef3746455eec3d1e69730b556809a225a4f714b6bc0b4bacfe5c7bb1a944105
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-retail-0005/FP16/face-detection-retail-0005.bin
+  - name: FP32-INT8/face-detection-retail-0005.xml
+    size: 414518
+    sha256: bfe8445ef8005454f9d2d9d5857c0e9de37c3e9dd474d6fb8882a32e2461e138
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-retail-0005/FP32-INT8/face-detection-retail-0005.xml
+  - name: FP32-INT8/face-detection-retail-0005.bin
+    size: 4214360
+    sha256: 0525d556261936e710d8b540f540718869e36c2e7347ee111dd68c259f6e5d54
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-detection-retail-0005/FP32-INT8/face-detection-retail-0005.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/face-reidentification-retail-0095/model.yml b/models/intel/face-reidentification-retail-0095/model.yml
index b47c5ab3e09..f52b68f8e1f 100644
--- a/models/intel/face-reidentification-retail-0095/model.yml
+++ b/models/intel/face-reidentification-retail-0095/model.yml
@@ -13,30 +13,32 @@
 # limitations under the License.
 
 description: >-
-  This is a lightweight network for the face re-identification scenario. It is
-  based on MobileNet V2 backbone, which consists of 3x3 inverted residual blocks
-  with squeeze-excitation attention modules. Instead of the ReLU6 activations
-  used in the original MobileNet V2, this network uses PReLU ones. After the backbone,
-  the network applies global depthwise pooling and then uses 1x1 convolution to
-  create the final embedding vector. The model produces feature vectors which
-  should be close in cosine distance for similar faces and far for different faces.
+  Single embedding-based face verification model
 task_type: face_recognition
 files:
   - name: FP32/face-reidentification-retail-0095.xml
-    size: 106214
-    sha256: 928396efb2af1dce2bc8a553c884852423a8d42b6a72c8904e7c57e1117bbbd4
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-reidentification-retail-0095/FP32/face-reidentification-retail-0095.xml
+    size: 225832
+    sha256: 3d0c0bebecb1d138dff373124d63e9baaa97b0259992f8741eb581d50c43b156
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-reidentification-retail-0095/FP32/face-reidentification-retail-0095.xml
   - name: FP32/face-reidentification-retail-0095.bin
     size: 4427256
     sha256: 03836a6a1d03828322491b0608a579b1c47e5097d355c489b5b8aaf5fce1ef48
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-reidentification-retail-0095/FP32/face-reidentification-retail-0095.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-reidentification-retail-0095/FP32/face-reidentification-retail-0095.bin
   - name: FP16/face-reidentification-retail-0095.xml
-    size: 106110
-    sha256: 0f13f0f9724c596774326be0c13dec8792dc0196b3d3da728938916e7dc8df21
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-reidentification-retail-0095/FP16/face-reidentification-retail-0095.xml
+    size: 225728
+    sha256: b8677b046dacd91a9ea0dfe388a7d58701fc09dfd8388716342da406078633b0
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-reidentification-retail-0095/FP16/face-reidentification-retail-0095.xml
   - name: FP16/face-reidentification-retail-0095.bin
-    size: 2213628
-    sha256: 3289078133e40e4263f682ded2a26a500905abb0fd7b943f41ca8037a4f3fe21
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/face-reidentification-retail-0095/FP16/face-reidentification-retail-0095.bin
+    size: 2213724
+    sha256: c2f8a7b9268e5b5236574d6fda2216df43c03acaa39c078848a98fbb707ae0a3
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-reidentification-retail-0095/FP16/face-reidentification-retail-0095.bin
+  - name: FP32-INT8/face-reidentification-retail-0095.xml
+    size: 643466
+    sha256: 6814d50c0ef1339d28447ffdd47335540a8d910bc8494c6afc185983f34bd466
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-reidentification-retail-0095/FP32-INT8/face-reidentification-retail-0095.xml
+  - name: FP32-INT8/face-reidentification-retail-0095.bin
+    size: 4551656
+    sha256: eaae8881109a2dab91fb7fddc73052378b015d6f3aa61b1c772eca21f87e4741
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/face-reidentification-retail-0095/FP32-INT8/face-reidentification-retail-0095.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/facial-landmarks-35-adas-0002/model.yml b/models/intel/facial-landmarks-35-adas-0002/model.yml
index 38f67a97f10..cd8b09099af 100644
--- a/models/intel/facial-landmarks-35-adas-0002/model.yml
+++ b/models/intel/facial-landmarks-35-adas-0002/model.yml
@@ -13,25 +13,32 @@
 # limitations under the License.
 
 description: >-
-  This is a custom-architecture convolutional neural network for 35 facial landmarks
-  estimation.
+  Custom-architecture convolutional neural network for 35 facial landmarks estimation.
 task_type: object_attributes
 files:
   - name: FP32/facial-landmarks-35-adas-0002.xml
-    size: 110860
-    sha256: e3eee579bf6c46ba8120e97bd824052f813bd08667b6ec64873a34a4feb1d6b4
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/facial-landmarks-35-adas-0002/FP32/facial-landmarks-35-adas-0002.xml
+    size: 237139
+    sha256: 4cb90657a60311184f3505ef973563180729bb7e8d5a2f6a42f9109c1af7bfdb
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/facial-landmarks-35-adas-0002/FP32/facial-landmarks-35-adas-0002.xml
   - name: FP32/facial-landmarks-35-adas-0002.bin
-    size: 18381136
-    sha256: 232b1a25de480227f36428fdb11a7a1f623acf37eb4232ced5fabac9b7dd2ad7
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/facial-landmarks-35-adas-0002/FP32/facial-landmarks-35-adas-0002.bin
+    size: 18381152
+    sha256: bd41c25201c2ea688a75549c11b9e10aa98e51dcc5a6dd783e84cdcf55a1011e
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/facial-landmarks-35-adas-0002/FP32/facial-landmarks-35-adas-0002.bin
   - name: FP16/facial-landmarks-35-adas-0002.xml
-    size: 110724
-    sha256: c9527dc629e02544858a1cd05feb5bed9fcba48e67d8d34a6ddf4f6481fd8e31
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/facial-landmarks-35-adas-0002/FP16/facial-landmarks-35-adas-0002.xml
+    size: 237002
+    sha256: 702d476efcab1e89519ff14b76812c61cd5123f86f5fc343512fa416a9a94e27
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/facial-landmarks-35-adas-0002/FP16/facial-landmarks-35-adas-0002.xml
   - name: FP16/facial-landmarks-35-adas-0002.bin
-    size: 9190568
-    sha256: b8945ba897072289c8cb44357bd211e728ecd1c093c1d4777b79d118a19ab58a
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/facial-landmarks-35-adas-0002/FP16/facial-landmarks-35-adas-0002.bin
+    size: 9190584
+    sha256: 88a2064849da0e6a31557f489ca4d652aa99e5a9676da0c5c857ee5d8cc26fe4
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/facial-landmarks-35-adas-0002/FP16/facial-landmarks-35-adas-0002.bin
+  - name: FP32-INT8/facial-landmarks-35-adas-0002.xml
+    size: 588492
+    sha256: d41ba7372ca2db93bd269db32567022109d3e2a9b7aed3da0ef1e8e021f95be2
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/facial-landmarks-35-adas-0002/FP32-INT8/facial-landmarks-35-adas-0002.xml
+  - name: FP32-INT8/facial-landmarks-35-adas-0002.bin
+    size: 18441156
+    sha256: f81ebf7c25f30138c2fa44530f51f516783ea790c5b6cacbaa5b31d95c73cbb7
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/facial-landmarks-35-adas-0002/FP32-INT8/facial-landmarks-35-adas-0002.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/gaze-estimation-adas-0002/description/gaze-estimation-adas-0002.md b/models/intel/gaze-estimation-adas-0002/description/gaze-estimation-adas-0002.md
index 67f97aa0cbb..214d22de893 100644
--- a/models/intel/gaze-estimation-adas-0002/description/gaze-estimation-adas-0002.md
+++ b/models/intel/gaze-estimation-adas-0002/description/gaze-estimation-adas-0002.md
@@ -9,7 +9,7 @@ This is a custom VGG-like convolutional neural network for gaze direction estima
 
 ![](./ill_for_gaze.png)
 
-The network takes three inputs: square crop of left eye image, square crop of right eye image, and three head pose angles -- (yaw, pitch, and roll) (see figure). The network outputs 3-D vector corresponding to the direction of a person’s gaze in a Cartesian coordinate system in which z-axis is directed from person’s eyes (mid-point between left and right eyes’ centers) to the camera center, y-axis is vertical, and x-axis is orthogonal to both z,y axes so that (x,y,z) constitute a right-handed coordinate system.
+The network takes three inputs: square crop of left eye image, square crop of right eye image, and three head pose angles -- (yaw, pitch, and roll) (see figure). The network outputs 3-D vector corresponding to the direction of a person's gaze in a Cartesian coordinate system in which z-axis is directed from person's eyes (mid-point between left and right eyes' centers) to the camera center, y-axis is vertical, and x-axis is orthogonal to both z,y axes so that (x,y,z) constitute a right-handed coordinate system.
 
 ## Specification
 
diff --git a/models/intel/gaze-estimation-adas-0002/model.yml b/models/intel/gaze-estimation-adas-0002/model.yml
index ff085a1be88..ec563cf7547 100644
--- a/models/intel/gaze-estimation-adas-0002/model.yml
+++ b/models/intel/gaze-estimation-adas-0002/model.yml
@@ -13,32 +13,32 @@
 # limitations under the License.
 
 description: >-
-  This is a custom VGG-like convolutional neural network for gaze direction estimation.
+  Gaze estimation for ADAS
 task_type: object_attributes
 files:
   - name: FP32/gaze-estimation-adas-0002.xml
-    size: 27546
-    sha256: 7aa055a1e660121be6fb7fa0c22368446046111b43ae5815e19f775dbb30eac5
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/gaze-estimation-adas-0002/FP32/gaze-estimation-adas-0002.xml
+    size: 63632
+    sha256: c676d6d02a128a7496ea8c93d15ffe10697e4171e64d164f4e90e659a2dbea6b
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/gaze-estimation-adas-0002/FP32/gaze-estimation-adas-0002.xml
   - name: FP32/gaze-estimation-adas-0002.bin
-    size: 7529292
-    sha256: 0c73b93bc4162b61a4abf6f1decc892f769e9c289de86793673dc0a723b84652
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/gaze-estimation-adas-0002/FP32/gaze-estimation-adas-0002.bin
+    size: 7529308
+    sha256: df935569980ab2654c46463fccb0ecc9ddd90423dcee85b3f933aa375baa15cf
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/gaze-estimation-adas-0002/FP32/gaze-estimation-adas-0002.bin
   - name: FP16/gaze-estimation-adas-0002.xml
-    size: 27505
-    sha256: 6f7cd2bede647667d4699a9e22c1330967868fa13c4764ff89b09e3ca0db6964
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/gaze-estimation-adas-0002/FP16/gaze-estimation-adas-0002.xml
+    size: 63591
+    sha256: daba62fae98a3719b8c95e5c821287ff0bb43b99d4c52e45e2615f6c88ffa67c
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/gaze-estimation-adas-0002/FP16/gaze-estimation-adas-0002.xml
   - name: FP16/gaze-estimation-adas-0002.bin
-    size: 3764654
-    sha256: 01acb7d0a596f1a691e6f36235fab07b99bcab9d97b9b8fb545ea1d1a27db3b0
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/gaze-estimation-adas-0002/FP16/gaze-estimation-adas-0002.bin
-  - name: INT8/gaze-estimation-adas-0002.xml
-    size: 143904
-    sha256: 45812fe1983c4f5b9293170f409d3713b8509aede1e3e4639d85e068a18ef2e9
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/gaze-estimation-adas-0002/INT8/gaze-estimation-adas-0002.xml
-  - name: INT8/gaze-estimation-adas-0002.bin
-    size: 7529308
-    sha256: ac281130aab7eb4a69a59520a483301b3cfe3d385402bfdec5640941fc1433f7
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/gaze-estimation-adas-0002/INT8/gaze-estimation-adas-0002.bin
+    size: 3764670
+    sha256: 03fa9ec80b6edf2ff6bfe5208e1fa13f17be534b80461de7e91b70f0ec1bcf85
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/gaze-estimation-adas-0002/FP16/gaze-estimation-adas-0002.bin
+  - name: FP32-INT8/gaze-estimation-adas-0002.xml
+    size: 142699
+    sha256: 1a2a07f51c29e6b2282e183baf3820fe434a8f009cb71bb274fdb5e5d21c4ed6
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/gaze-estimation-adas-0002/FP32-INT8/gaze-estimation-adas-0002.xml
+  - name: FP32-INT8/gaze-estimation-adas-0002.bin
+    size: 7542172
+    sha256: 0254e6bacc23912ba647a626ebe9e4562e8b824ab157442714dbf2e3d13d4996
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/gaze-estimation-adas-0002/FP32-INT8/gaze-estimation-adas-0002.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/handwritten-score-recognition-0003/model.yml b/models/intel/handwritten-score-recognition-0003/model.yml
index a430579a194..257ba5abcb7 100644
--- a/models/intel/handwritten-score-recognition-0003/model.yml
+++ b/models/intel/handwritten-score-recognition-0003/model.yml
@@ -13,27 +13,33 @@
 # limitations under the License.
 
 description: >-
-  This is a network for text recognition scenario. It consists of VGG16-like backbone
-  and bidirectional LSTM encoder-decoder. The network is able to recognize school
-  marks that should have format either `<digit>` or `<digit>.<digit>` (e.g. `4`
-  or `3.5`).
+  Recognizes school marks (e.g. '4' or '3.5'). Alphabet is '0123456789._'. Architecture:
+  VGG-like + BiLSTM as an encoder - BiLSTM as a decoder.
 task_type: optical_character_recognition
 files:
   - name: FP32/handwritten-score-recognition-0003.xml
-    size: 41876
-    sha256: 16b69c46a99f5bc6d05c7d08e1170cc7f7f7a051e3ca156ced906b0560dcd2ee
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/handwritten-score-recognition-0003/FP32/handwritten-score-recognition-0003.xml
+    size: 80600
+    sha256: 2136bb229ad044d354dc03591b35462989d92ff7716fb1cf30ba83748d162c5a
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/handwritten-score-recognition-0003/FP32/handwritten-score-recognition-0003.xml
   - name: FP32/handwritten-score-recognition-0003.bin
-    size: 41121868
-    sha256: 56dc7bf776b712be477417ec153f34af57f31444d40772f181889544334c67e1
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/handwritten-score-recognition-0003/FP32/handwritten-score-recognition-0003.bin
+    size: 41121956
+    sha256: 55350eecb10ea7c95b495a44dcd78b8287e124abed4689956aea23bff062b8ff
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/handwritten-score-recognition-0003/FP32/handwritten-score-recognition-0003.bin
   - name: FP16/handwritten-score-recognition-0003.xml
-    size: 41857
-    sha256: 1aaa04c37887ac21d6bad7e8ae03ec02ebf32a338a762e42fe68b1456982645a
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/handwritten-score-recognition-0003/FP16/handwritten-score-recognition-0003.xml
+    size: 80575
+    sha256: 287586935587d49032a94322f345fc36f356c1b34b3af2b87ba1da23b08b5427
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/handwritten-score-recognition-0003/FP16/handwritten-score-recognition-0003.xml
   - name: FP16/handwritten-score-recognition-0003.bin
-    size: 20560946
-    sha256: 4d7d4df0bd8e69fbf9a3d3d34cf2d1e0df1abe201f8d083457cd3ab8f5402d92
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/handwritten-score-recognition-0003/FP16/handwritten-score-recognition-0003.bin
+    size: 20561030
+    sha256: b19f78f990bbfd7d86c52c075a094a18578de3243b5d531692bf8bd9afd4d9f4
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/handwritten-score-recognition-0003/FP16/handwritten-score-recognition-0003.bin
+  - name: FP32-INT8/handwritten-score-recognition-0003.xml
+    size: 114475
+    sha256: 88c6c1bdaa04ac926ef851d4284543a0ba71334e0fe573a3ca314a967d139476
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/handwritten-score-recognition-0003/FP32-INT8/handwritten-score-recognition-0003.xml
+  - name: FP32-INT8/handwritten-score-recognition-0003.bin
+    size: 41140544
+    sha256: c0bb0af31e9657fa36f7ed9094b8ef9c2fb0f1d03576a2ebe6751ba3e072622d
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/handwritten-score-recognition-0003/FP32-INT8/handwritten-score-recognition-0003.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/head-pose-estimation-adas-0001/description/head-pose-estimation-adas-0001.md b/models/intel/head-pose-estimation-adas-0001/description/head-pose-estimation-adas-0001.md
index 9ad37caaa6d..c8db65f4008 100644
--- a/models/intel/head-pose-estimation-adas-0001/description/head-pose-estimation-adas-0001.md
+++ b/models/intel/head-pose-estimation-adas-0001/description/head-pose-estimation-adas-0001.md
@@ -53,7 +53,7 @@ Output layer names in Caffe* format:
 
 
 Each output contains one float value that represents value in Tait-Bryan angles
-(yaw, pitсh or roll).
+(yaw, pitch or roll).
 
 ## Legal Information
 [*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/head-pose-estimation-adas-0001/model.yml b/models/intel/head-pose-estimation-adas-0001/model.yml
index 451aec65bd8..877d1b3b53e 100644
--- a/models/intel/head-pose-estimation-adas-0001/model.yml
+++ b/models/intel/head-pose-estimation-adas-0001/model.yml
@@ -13,26 +13,32 @@
 # limitations under the License.
 
 description: >-
-  Head pose estimation network based on simple, handmade CNN architecture. Angle
-  regression layers are convolutions + ReLU + batch norm + fully connected with
-  one output.
+  Vanilla CNN trained from scratch yaw + pitch + roll + landmarks
 task_type: head_pose_estimation
 files:
   - name: FP32/head-pose-estimation-adas-0001.xml
-    size: 18290
-    sha256: 01d23643c35ebf63b62d88216936fd77214c7a90684af162b0c7f6b75bf4eb84
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/head-pose-estimation-adas-0001/FP32/head-pose-estimation-adas-0001.xml
+    size: 50622
+    sha256: 5e0994e906aff30241441e0910e3527ca6d8ca0d756457adb34e53d418016cc7
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/head-pose-estimation-adas-0001/FP32/head-pose-estimation-adas-0001.xml
   - name: FP32/head-pose-estimation-adas-0001.bin
-    size: 7645540
-    sha256: e4047e643bd39d97288dc5d22abe8ead850e05ac1bc44605443bbb2abfc2e246
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/head-pose-estimation-adas-0001/FP32/head-pose-estimation-adas-0001.bin
+    size: 7647604
+    sha256: a9110b175f7cb082049d5fcd4c48825e9c00688901aecb22fa70c2535aff282c
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/head-pose-estimation-adas-0001/FP32/head-pose-estimation-adas-0001.bin
   - name: FP16/head-pose-estimation-adas-0001.xml
-    size: 18279
-    sha256: 7ac8b562cba4bda2390dbdf0c0055e888fb47b7ae4b73b9a180b4e354fd186b1
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/head-pose-estimation-adas-0001/FP16/head-pose-estimation-adas-0001.xml
+    size: 50610
+    sha256: f98f34ff5b2382c7c9185ac3aa8a329db268c9f9d93eb40c385f5812e1ef3913
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/head-pose-estimation-adas-0001/FP16/head-pose-estimation-adas-0001.xml
   - name: FP16/head-pose-estimation-adas-0001.bin
-    size: 3822770
-    sha256: 535a6af806999e22cca5e4071e55841a694a6b60370a6f8fb3b9d0cda5f81c41
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/head-pose-estimation-adas-0001/FP16/head-pose-estimation-adas-0001.bin
+    size: 3823810
+    sha256: e37b71a654656a78d4014ae8e46baab83a9c06a41df5f5c5122e9bbee46a63f2
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/head-pose-estimation-adas-0001/FP16/head-pose-estimation-adas-0001.bin
+  - name: FP32-INT8/head-pose-estimation-adas-0001.xml
+    size: 81656
+    sha256: c5697706a3cf57386e626bb5c666c737373a18379e20f0ae135fa5eb4404a1be
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/head-pose-estimation-adas-0001/FP32-INT8/head-pose-estimation-adas-0001.xml
+  - name: FP32-INT8/head-pose-estimation-adas-0001.bin
+    size: 7657904
+    sha256: 460e2160619fce6e9986e99130c55468e95e0364f7907fb339555807029da296
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/head-pose-estimation-adas-0001/FP32-INT8/head-pose-estimation-adas-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/human-pose-estimation-0001/description/human-pose-estimation-0001.md b/models/intel/human-pose-estimation-0001/description/human-pose-estimation-0001.md
index c7597944845..c80bbf228ef 100644
--- a/models/intel/human-pose-estimation-0001/description/human-pose-estimation-0001.md
+++ b/models/intel/human-pose-estimation-0001/description/human-pose-estimation-0001.md
@@ -2,7 +2,9 @@
 
 ## Use Case and High-Level Description
 
-This is a multi-person 2D pose estimation network (based on the OpenPose approach) with tuned MobileNet v1 as a feature extractor. It finds a human pose: body skeleton, which consists of keypoints and connections between them, for every person inside image. The pose may contain up to 18 keypoints: ears, eyes, nose, neck, shoulders, elbows, wrists, hips, knees and ankles.
+This is a multi-person 2D pose estimation network (based on the OpenPose approach) with tuned MobileNet v1 as a feature extractor.
+For every person in an image, the network detects a human pose: a body skeleton consisting of keypoints and connections between them.
+The pose may contain up to 18 keypoints: ears, eyes, nose, neck, shoulders, elbows, wrists, hips, knees, and ankles.
 
 ## Example
 
@@ -19,13 +21,13 @@ This is a multi-person 2D pose estimation network (based on the OpenPose approac
 
 Average Precision metric described in [COCO Keypoint Evaluation site](http://cocodataset.org/#keypoints-eval).
 
-Tested on a COCO validation subset from the original paper: Cao et al. ["Realtime Multi-Person 2D Pose Estimation using Part Affinity Fields"](https://arxiv.org/pdf/1611.08050.pdf).
+Tested on a COCO validation subset from the original paper [Realtime Multi-Person 2D Pose Estimation using Part Affinity Fields](https://arxiv.org/pdf/1611.08050.pdf).
 
 ## Performance
 
 ## Inputs
 
-1. name: "input" , shape: [1x3x256x456] - An input image in the format [BxCxHxW],
+1. Name: `input`, shape: [1x3x256x456]. An input image in the [BxCxHxW] format,
   where:
     - B - batch size
     - C - number of channels
@@ -35,7 +37,7 @@ Tested on a COCO validation subset from the original paper: Cao et al. ["Realtim
 
 ## Outputs
 
-1. The net outputs two blobs with shapes: [1, 38, 32, 57] and [1, 19, 32, 57]. The first blob contains keypoint pairwise relations (part affinity fields), the second one contains keypoint heatmaps.
+The net outputs two blobs with the [1, 38, 32, 57] and [1, 19, 32, 57] shapes. The first blob contains keypoint pairwise relations (part affinity fields), while the second blob contains keypoint heatmaps.
 
 ## Legal Information
 [*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/human-pose-estimation-0001/model.yml b/models/intel/human-pose-estimation-0001/model.yml
index 2d459850605..c93d49c125b 100644
--- a/models/intel/human-pose-estimation-0001/model.yml
+++ b/models/intel/human-pose-estimation-0001/model.yml
@@ -13,36 +13,32 @@
 # limitations under the License.
 
 description: >-
-  This is a multi-person 2D pose estimation network (based on the OpenPose approach)
-  with tuned MobileNet v1 as a feature extractor. It finds a human pose: body
-  skeleton, which consists of keypoints and connections between them, for every
-  person inside image. The pose may contain up to 18 keypoints: ears, eyes, nose,
-  neck, shoulders, elbows, wrists, hips, knees and ankles.
+  2D human pose estimation with tuned mobilenet backbone (based on OpenPose).
 task_type: human_pose_estimation
 files:
   - name: FP32/human-pose-estimation-0001.xml
-    size: 66630
-    sha256: 48c77d491a52b2c08f107a5acdb3093293081de37fc5e5fd827a8c905e56e342
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/human-pose-estimation-0001/FP32/human-pose-estimation-0001.xml
+    size: 143782
+    sha256: 4d2cc5d3a8c395affa74ae640a63ba9bae9bd5871527d65f62a87cc5b40831e9
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/human-pose-estimation-0001/FP32/human-pose-estimation-0001.xml
   - name: FP32/human-pose-estimation-0001.bin
-    size: 16394720
-    sha256: 9790da47abf072c509ff843695a7b9b96283729731ba4d711fb50201f376b2fc
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/human-pose-estimation-0001/FP32/human-pose-estimation-0001.bin
+    size: 16394712
+    sha256: 1cd32cb5f9f4633b8ee1451144f749ddd75038c4c5fe862e704e489908b79a78
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/human-pose-estimation-0001/FP32/human-pose-estimation-0001.bin
   - name: FP16/human-pose-estimation-0001.xml
-    size: 66557
-    sha256: 6ccb526cfe58f6f05abb0997831eb24d8dd8cb3bd07791387bcd55aedc5e4a66
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/human-pose-estimation-0001/FP16/human-pose-estimation-0001.xml
+    size: 143706
+    sha256: 75bda095e6fa1b1c118e085c4e5f4be9d9d9db512578fd6ec57b3113d5b42dae
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/human-pose-estimation-0001/FP16/human-pose-estimation-0001.xml
   - name: FP16/human-pose-estimation-0001.bin
-    size: 8197360
-    sha256: 48c607a55b22b540c38b6ed295eba211aaa6cd4acd47776f0a1259829cb51196
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/human-pose-estimation-0001/FP16/human-pose-estimation-0001.bin
-  - name: INT8/human-pose-estimation-0001.xml
-    size: 610556
-    sha256: 1bd2a7c8e36fd7a5ae7ea9f3489d0b995b666407cff3883217235900a1078330
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/human-pose-estimation-0001/INT8/human-pose-estimation-0001.xml
-  - name: INT8/human-pose-estimation-0001.bin
-    size: 16394720
-    sha256: 0d252f0fd98c598fb38eaa907fa8b3d15cf2d420d743649b4b6c5dbdbbe5f1ac
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/human-pose-estimation-0001/INT8/human-pose-estimation-0001.bin
+    size: 8197356
+    sha256: c1c828d5d1ea2b03035692a8600f06d787fe1a20e79dac159c4293ed7063a382
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/human-pose-estimation-0001/FP16/human-pose-estimation-0001.bin
+  - name: FP32-INT8/human-pose-estimation-0001.xml
+    size: 408100
+    sha256: 6e22b77c4e5f2c39bb14603c3bfa2d902210a3fdb3fe89443eab5fb149c3a470
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/human-pose-estimation-0001/FP32-INT8/human-pose-estimation-0001.xml
+  - name: FP32-INT8/human-pose-estimation-0001.bin
+    size: 16513820
+    sha256: 482635ee949716049bd7dd5a69ab66a6d5f29a5cc86598c0369035be2d1fa274
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/human-pose-estimation-0001/FP32-INT8/human-pose-estimation-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/image-retrieval-0001/model.yml b/models/intel/image-retrieval-0001/model.yml
index f251e187aae..da44b50f09a 100644
--- a/models/intel/image-retrieval-0001/model.yml
+++ b/models/intel/image-retrieval-0001/model.yml
@@ -13,26 +13,33 @@
 # limitations under the License.
 
 description: >-
-  `image-retrieval-0001` is an image retrieval model based on Mobilenet v2 as
-  a backbone. The model produces l2-normalized embeddings with dimension that
-  equals to 256.
+  An image retrieval model based on Mobilenet v2 as a backbone. The model produces
+  l2-normalized embeddings with a dimension of 256.
 task_type: object_attributes
 files:
   - name: FP32/image-retrieval-0001.xml
-    size: 65666
-    sha256: ae46340eaa2848f7feed8f33431cacf1c94d310eb968efd4c9c878b96f707a92
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/image-retrieval-0001/FP32/image-retrieval-0001.xml
+    size: 139941
+    sha256: 9ccf302bde086b4173f6214fce186c50c59f45f0d90e42cdeb887bdba5d69320
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/image-retrieval-0001/FP32/image-retrieval-0001.xml
   - name: FP32/image-retrieval-0001.bin
-    size: 10140104
-    sha256: 3826d08fd7968e002ca2a8d880840622e925eb000b343518b709b24151d2aeeb
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/image-retrieval-0001/FP32/image-retrieval-0001.bin
+    size: 10139176
+    sha256: 337b7602546e34877bdaba7b7a873698dd1ca46265ef8c0c83b2531f360293f8
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/image-retrieval-0001/FP32/image-retrieval-0001.bin
   - name: FP16/image-retrieval-0001.xml
-    size: 65601
-    sha256: b6c148e05d0e06b6ef32d8d8264b2c637f66416cb7b819847804492c67b7df26
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/image-retrieval-0001/FP16/image-retrieval-0001.xml
+    size: 139875
+    sha256: bdbd7fb3700cf8e44853c03bd489cfb9b5ef3fd50828ce5cace938fbebf0218e
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/image-retrieval-0001/FP16/image-retrieval-0001.xml
   - name: FP16/image-retrieval-0001.bin
-    size: 5070076
-    sha256: 79d272e74b68f00987447080527a3dbe30dde8ca82acce1f031cbb68b6e61ad2
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/image-retrieval-0001/FP16/image-retrieval-0001.bin
+    size: 5069656
+    sha256: 638931867ab133c8c6b0fa659a19b12d5b9ac6ce52f72b961f1d35e8ff812edd
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/image-retrieval-0001/FP16/image-retrieval-0001.bin
+  - name: FP32-INT8/image-retrieval-0001.xml
+    size: 402526
+    sha256: 506c619a98d1de256a5a179cd7d086a9cd340de3ef045acba9dfa4cf2b8863d8
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/image-retrieval-0001/FP32-INT8/image-retrieval-0001.xml
+  - name: FP32-INT8/image-retrieval-0001.bin
+    size: 10316580
+    sha256: 8247914522e23c4ca8c291f59d6cb4d29dc780121fbc79eb8e02052eeb1796fc
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/image-retrieval-0001/FP32-INT8/image-retrieval-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/inceptionv3-int8-sparse-v1-tf-0001/description/inceptionv3-int8-sparse-v1-tf-0001.md b/models/intel/inceptionv3-int8-sparse-v1-tf-0001/description/inceptionv3-int8-sparse-v1-tf-0001.md
deleted file mode 100644
index c8f2c695c80..00000000000
--- a/models/intel/inceptionv3-int8-sparse-v1-tf-0001/description/inceptionv3-int8-sparse-v1-tf-0001.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# inceptionv3-int8-sparse-v1-tf-0001
-
-## Use Case and High-Level Description
-
-This is the Inception v3 model that is designed to perform image classification. The model has been pretrained on the ImageNet image database and then pruned to **30.9%** of sparsity and quantized to INT8 fixed-point precision using so-called Quantization-aware training approach implemented in TensorFlow framework. The sparsity is represented by zeros inside the weights of Convolutional and Fully-conneted layers. For details about the original floating point model, check out the [paper](https://arxiv.org/pdf/1512.03385.pdf).
-
-The model input is a blob that consists of a single image of "1x299x299x3" in BGR order.
-
-The model output for `inceptionv3-int8-sparse-v1-tf-0001` is the usual object classifier output for the 1001 different classifications matching those in the ImageNet database (the first item represents the background).
-
-## Example
-
-## Specification
-
-| Metric            | Value         |
-|-------------------|---------------|
-| Type              | Classification|
-| GFLOPs            | 11.469        |
-| MParams           | 23.819        |
-| Source framework  | TensorFlow    |
-
-## Accuracy
-
-The quality metrics calculated on ImageNet validation dataset is 78.65% accuracy top-1.
-
-| Metric                    | Value         |
-|---------------------------|---------------|
-| Accuracy top-1 (ImageNet) |        78.65% |
-
-## Performance
-
-## Input
-
-Image, shape - `1,299,299,3`, format is `B,H,W,C` where:
-
-- `B` - batch size
-- `H` - height
-- `W` - width
-- `C` - channel
-
-Channel order is `BGR`
-
-## Output
-
-Object classifier according to ImageNet classes, shape -`1,1001`, output data format is `B,C` where:
-
-- `B` - batch size
-- `C` - predicted probabilities for each class in  [0, 1] range
-
diff --git a/models/intel/inceptionv3-int8-sparse-v1-tf-0001/model.yml b/models/intel/inceptionv3-int8-sparse-v1-tf-0001/model.yml
deleted file mode 100644
index a19f8de96f3..00000000000
--- a/models/intel/inceptionv3-int8-sparse-v1-tf-0001/model.yml
+++ /dev/null
@@ -1,49 +0,0 @@
-# Copyright (c) 2019 Intel Corporation
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-description: >-
-  This is the Inception v3 model that is designed to perform image classification.
-  The model has been pretrained on the ImageNet image database and then pruned
-  to **30.9%** of sparsity and quantized to INT8 fixed-point precision using
-  so-called Quantization-aware training approach implemented in TensorFlow framework.
-  The sparsity is represented by zeros inside the weights of Convolutional and
-  Fully-conneted layers. For details about the original floating point model,
-  check out the paper <https://arxiv.org/pdf/1512.03385.pdf>.
-
-  The model input is a blob that consists of a single image of "1x299x299x3"
-  in BGR order.
-
-  The model output for `inceptionv3-int8-sparse-v1-tf-0001` is the usual object
-  classifier output for the 1001 different classifications matching those in
-  the ImageNet database (the first item represents the background).
-task_type: classification
-files:
-  - name: FP32/inceptionv3-int8-sparse-v1-tf-0001.xml
-    size: 613524
-    sha256: 87930652f040d2247ff866afcac33fdb7ec195752115742c7c0e3a281d468852
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/inceptionv3-int8-sparse-v1-tf-0001/FP32/inceptionv3-int8-sparse-v1-tf-0001.xml
-  - name: FP32/inceptionv3-int8-sparse-v1-tf-0001.bin
-    size: 95277636
-    sha256: 0f6d02a75232a81cffe0ed86e2dec132bd92cf6f69f6bb61f5fcd1a7641ede6b
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/inceptionv3-int8-sparse-v1-tf-0001/FP32/inceptionv3-int8-sparse-v1-tf-0001.bin
-  - name: FP16/inceptionv3-int8-sparse-v1-tf-0001.xml
-    size: 613425
-    sha256: c8475996cd397dfb391917981a4ed0da188a55a3ae1f0fb051ed29f1fbafd181
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/inceptionv3-int8-sparse-v1-tf-0001/FP16/inceptionv3-int8-sparse-v1-tf-0001.xml
-  - name: FP16/inceptionv3-int8-sparse-v1-tf-0001.bin
-    size: 47638822
-    sha256: 242c61e090a4b5ee235084ddabe410a220feaddffefb5b9c40b99c56d27f51d5
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/inceptionv3-int8-sparse-v1-tf-0001/FP16/inceptionv3-int8-sparse-v1-tf-0001.bin
-framework: dldt
-license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/inceptionv3-int8-sparse-v2-tf-0001/description/inceptionv3-int8-sparse-v2-tf-0001.md b/models/intel/inceptionv3-int8-sparse-v2-tf-0001/description/inceptionv3-int8-sparse-v2-tf-0001.md
deleted file mode 100644
index 9e7a94198bd..00000000000
--- a/models/intel/inceptionv3-int8-sparse-v2-tf-0001/description/inceptionv3-int8-sparse-v2-tf-0001.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# inceptionv3-int8-sparse-v2-tf-0001
-
-## Use Case and High-Level Description
-
-This is the Inception v3 model that is designed to perform image classification. The model has been pretrained on the ImageNet image database and then pruned to **59.9%** of sparsity and quantized to INT8 fixed-point precision using so-called Quantization-aware training approach implemented in TensorFlow framework. The sparsity is represented by zeros inside the weights of Convolutional and Fully-conneted layers. For details about the original floating point model, check out the [paper](https://arxiv.org/pdf/1512.03385.pdf).
-
-The model input is a blob that consists of a single image of "1x299x299x3" in BGR order.
-
-The model output for `inceptionv3-int8-sparse-v2-tf-0001` is the usual object classifier output for the 1001 different classifications matching those in the ImageNet database (the first item represents the background).
-
-## Example
-
-## Specification
-
-| Metric            | Value         |
-|-------------------|---------------|
-| Type              | Classification|
-| GFLOPs            | 11.469        |
-| MParams           | 23.819        |
-| Source framework  | TensorFlow    |
-
-## Accuracy
-
-The quality metrics calculated on ImageNet validation dataset is 78.26% accuracy top-1.
-
-| Metric                    | Value         |
-|---------------------------|---------------|
-| Accuracy top-1 (ImageNet) |        78.26% |
-
-## Performance
-
-## Input
-
-Image, shape - `1,299,299,3`, format is `B,H,W,C` where:
-
-- `B` - batch size
-- `H` - height
-- `W` - width
-- `C` - channel
-
-Channel order is `BGR`
-
-## Output
-
-Object classifier according to ImageNet classes, shape -`1,1001`, output data format is `B,C` where:
-
-- `B` - batch size
-- `C` - predicted probabilities for each class in  [0, 1] range
-
diff --git a/models/intel/inceptionv3-int8-sparse-v2-tf-0001/model.yml b/models/intel/inceptionv3-int8-sparse-v2-tf-0001/model.yml
deleted file mode 100644
index 4d499184c20..00000000000
--- a/models/intel/inceptionv3-int8-sparse-v2-tf-0001/model.yml
+++ /dev/null
@@ -1,49 +0,0 @@
-# Copyright (c) 2019 Intel Corporation
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-description: >-
-  This is the Inception v3 model that is designed to perform image classification.
-  The model has been pretrained on the ImageNet image database and then pruned
-  to **59.9%** of sparsity and quantized to INT8 fixed-point precision using
-  so-called Quantization-aware training approach implemented in TensorFlow framework.
-  The sparsity is represented by zeros inside the weights of Convolutional and
-  Fully-conneted layers. For details about the original floating point model,
-  check out the paper <https://arxiv.org/pdf/1512.03385.pdf>.
-
-  The model input is a blob that consists of a single image of "1x299x299x3"
-  in BGR order.
-
-  The model output for `inceptionv3-int8-sparse-v2-tf-0001` is the usual object
-  classifier output for the 1001 different classifications matching those in
-  the ImageNet database (the first item represents the background).
-task_type: classification
-files:
-  - name: FP32/inceptionv3-int8-sparse-v2-tf-0001.xml
-    size: 613563
-    sha256: d18c00828bd59cb716501b06378716c9d2a3317961d7326b972747ce690094bf
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/inceptionv3-int8-sparse-v2-tf-0001/FP32/inceptionv3-int8-sparse-v2-tf-0001.xml
-  - name: FP32/inceptionv3-int8-sparse-v2-tf-0001.bin
-    size: 95277636
-    sha256: ee0f9b9e7aa60a72a14696a000616e7ce230db032b1e47e86b13bed102aa6f50
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/inceptionv3-int8-sparse-v2-tf-0001/FP32/inceptionv3-int8-sparse-v2-tf-0001.bin
-  - name: FP16/inceptionv3-int8-sparse-v2-tf-0001.xml
-    size: 613464
-    sha256: 86fcb895e570b59a80d5c899e1afa59a1b4804defc5a1a0a2e3141e25b7af535
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/inceptionv3-int8-sparse-v2-tf-0001/FP16/inceptionv3-int8-sparse-v2-tf-0001.xml
-  - name: FP16/inceptionv3-int8-sparse-v2-tf-0001.bin
-    size: 47638822
-    sha256: 1fd2fc1119b7e956b1ae4a3faa5d4de2fdd20f2d6bc247a5f0e0fa601d56adfa
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/inceptionv3-int8-sparse-v2-tf-0001/FP16/inceptionv3-int8-sparse-v2-tf-0001.bin
-framework: dldt
-license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/inceptionv3-int8-tf-0001/description/inceptionv3-int8-tf-0001.md b/models/intel/inceptionv3-int8-tf-0001/description/inceptionv3-int8-tf-0001.md
deleted file mode 100644
index b71b104829f..00000000000
--- a/models/intel/inceptionv3-int8-tf-0001/description/inceptionv3-int8-tf-0001.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# inceptionv3-int8-tf-0001
-
-## Use Case and High-Level Description
-
-This is the Inception v3 model that is designed to perform image classification. The model has been pretrained on the ImageNet image database and then quantized to INT8 fixed-point precision using so-called Quantization-aware training approach implemented in TensorFlow framework. For details about the original floating point model, check out the [paper](https://arxiv.org/pdf/1512.03385.pdf).
-
-The model input is a blob that consists of a single image of "1x299x299x3" in BGR order.
-
-The model output for `inceptionv3-int8-tf-0001` is the usual object classifier output for the 1001 different classifications matching those in the ImageNet database (the first item represents the background).
-
-## Example
-
-## Specification
-
-| Metric            | Value         |
-|-------------------|---------------|
-| Type              | Classification|
-| GFLOPs            | 11.469        |
-| MParams           | 23.819        |
-| Source framework  | TensorFlow    |
-
-## Accuracy
-
-The quality metrics calculated on ImageNet validation dataset is 78.07% accuracy top-1.
-
-| Metric                    | Value         |
-|---------------------------|---------------|
-| Accuracy top-1 (ImageNet) |        78.07% |
-
-## Performance
-
-## Input
-
-Image, shape - `1,299,299,3`, format is `B,H,W,C` where:
-
-- `B` - batch size
-- `H` - height
-- `W` - width
-- `C` - channel
-
-Channel order is `BGR`
-
-## Output
-
-Object classifier according to ImageNet classes, shape -`1,1001`, output data format is `B,C` where:
-
-- `B` - batch size
-- `C` - predicted probabilities for each class in  [0, 1] range
-
diff --git a/models/intel/inceptionv3-int8-tf-0001/model.yml b/models/intel/inceptionv3-int8-tf-0001/model.yml
deleted file mode 100644
index 43a9ce941b4..00000000000
--- a/models/intel/inceptionv3-int8-tf-0001/model.yml
+++ /dev/null
@@ -1,47 +0,0 @@
-# Copyright (c) 2019 Intel Corporation
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-description: >-
-  This is the Inception v3 model that is designed to perform image classification.
-  The model has been pretrained on the ImageNet image database and then quantized
-  to INT8 fixed-point precision using so-called Quantization-aware training
-  approach implemented in TensorFlow framework. For details about the original
-  floating point model, check out the paper <https://arxiv.org/pdf/1512.03385.pdf>.
-
-  The model input is a blob that consists of a single image of "1x299x299x3"
-  in BGR order.
-
-  The model output for `inceptionv3-int8-tf-0001` is the usual object classifier
-  output for the 1001 different classifications matching those in the ImageNet
-  database (the first item represents the background).
-task_type: classification
-files:
-  - name: FP32/inceptionv3-int8-tf-0001.xml
-    size: 612437
-    sha256: 079b9fabee7796875b3e5bc8cadf868780280df1a9cc681387bb41da1b014d27
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/inceptionv3-int8-tf-0001/FP32/inceptionv3-int8-tf-0001.xml
-  - name: FP32/inceptionv3-int8-tf-0001.bin
-    size: 95277636
-    sha256: 5f1a34c4e1d925b5ec196e23c33a16df173e2f7788339b9b1390cd82a45cf488
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/inceptionv3-int8-tf-0001/FP32/inceptionv3-int8-tf-0001.bin
-  - name: FP16/inceptionv3-int8-tf-0001.xml
-    size: 612338
-    sha256: 0b9f55351e66e5b3d70e88a3b060601c37891868b70a6c84aa3a6be722c136a6
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/inceptionv3-int8-tf-0001/FP16/inceptionv3-int8-tf-0001.xml
-  - name: FP16/inceptionv3-int8-tf-0001.bin
-    size: 47638822
-    sha256: da2daa50ad511e3b29e7645528536ebb32636df630f3dc1d927eed0922cec60e
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/inceptionv3-int8-tf-0001/FP16/inceptionv3-int8-tf-0001.bin
-framework: dldt
-license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/index.md b/models/intel/index.md
index b41fc1ad52d..7cb053aa9f1 100644
--- a/models/intel/index.md
+++ b/models/intel/index.md
@@ -18,26 +18,29 @@ detect the same types of objects (for example, `face-detection-adas-0001` and
 applicability at the cost of slower performance, so you can expect a "bigger"
 network to detect objects of the same type better.
 
-| Model Name                                                                                                                                                                          | Complexity (GFLOPs)  | Size (Mp)  | Face  | Person  | Vehicle  | Bike  | License plate  |
-|------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |--------------------- |----------- |------ |-------- |--------- |------ |--------------- |
-| [face-detection-adas-0001](./face-detection-adas-0001/description/face-detection-adas-0001.md)                                                                                      | 2.835                | 1.053      | X     |         |          |       |                |
-| [face-detection-adas-binary-0001](./face-detection-adas-binary-0001/description/face-detection-adas-binary-0001.md)                                                                 | 0.819                | 1.053      | X     |         |          |       |                |
-| [face-detection-retail-0004](./face-detection-retail-0004/description/face-detection-retail-0004.md)                                                                                | 1.067                | 0.588      | X     |         |          |       |                |
-| [face-detection-retail-0005](./face-detection-retail-0005/description/face-detection-retail-0005.md)                                                                                | 0.982                | 1.021      | X     |         |          |       |                |
-| [person-detection-retail-0002](./person-detection-retail-0002/description/person-detection-retail-0002.md)                                                                          | 12.427               | 3.244      |       | X       |          |       |                |
-| [person-detection-retail-0013](./person-detection-retail-0013/description/person-detection-retail-0013.md)                                                                          | 2.300                | 0.723      |       | X       |          |       |                |
-| [person-detection-action-recognition-0005](./person-detection-action-recognition-0005/description/person-detection-action-recognition-0005.md)                                      | 7.140                | 1.951      |       | X       |          |       |                |
-| [person-detection-action-recognition-0006](./person-detection-action-recognition-0006/description/person-detection-action-recognition-0006.md)                                      | 8.225                | 2.001      |       | X       |          |       |                |
-| [person-detection-action-recognition-teacher-0002](./person-detection-action-recognition-teacher-0002/description/person-detection-action-recognition-teacher-0002.md)              | 7.140                | 1.951      |       | X       |          |       |                |
-| [person-detection-raisinghand-recognition-0001](./person-detection-raisinghand-recognition-0001/description/person-detection-raisinghand-recognition-0001.md)                    | 7.138                | 1.951      |       | X       |          |       |                |
-| [pedestrian-detection-adas-0002](./pedestrian-detection-adas-0002/description/pedestrian-detection-adas-0002.md)                                                                    | 2.836                | 1.165      |       | X       |          |       |                |
-| [pedestrian-detection-adas-binary-0001](./pedestrian-detection-adas-binary-0001/description/pedestrian-detection-adas-binary-0001.md)                                               | 0.945                | 1.165      |       | X       |          |       |                |
-| [pedestrian-and-vehicle-detector-adas-0001](./pedestrian-and-vehicle-detector-adas-0001/description/pedestrian-and-vehicle-detector-adas-0001.md)                                   | 3.974                | 1.650      |       | X       | X        |       |                |
-| [vehicle-detection-adas-0002](./vehicle-detection-adas-0002/description/vehicle-detection-adas-0002.md)                                                                             | 2.798                | 1.079      |       |         | X        |       |                |
-| [vehicle-detection-adas-binary-0001](./vehicle-detection-adas-binary-0001/description/vehicle-detection-adas-binary-0001.md)                                                        | 0.942                | 1.079      |       |         | X        |       |                |
-| [person-vehicle-bike-detection-crossroad-0078](./person-vehicle-bike-detection-crossroad-0078/description/person-vehicle-bike-detection-crossroad-0078.md)                          | 3.964                | 1.178      |       | X       | X        | X     |                |
-| [person-vehicle-bike-detection-crossroad-1016](./person-vehicle-bike-detection-crossroad-1016/description/person-vehicle-bike-detection-crossroad-1016.md)                          | 3.560                | 2.887      |       | X       | X        | X     |                |
-| [vehicle-license-plate-detection-barrier-0106](./vehicle-license-plate-detection-barrier-0106/description/vehicle-license-plate-detection-barrier-0106.md)                          | 0.349                | 0.634      |       |         | X        |       | X              |
+| Model Name                                                                                                                                                                          | Complexity (GFLOPs)  | Size (Mp)  | Face  | Person  | Vehicle  | Bike  | License plate  | Product |
+|------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------ |--------------------- |----------- |------ |-------- |--------- |------ |--------------- |-------- |
+| [face-detection-adas-0001](./face-detection-adas-0001/description/face-detection-adas-0001.md)                                                                                      | 2.835                | 1.053      | X     |         |          |       |                |         |
+| [face-detection-adas-binary-0001](./face-detection-adas-binary-0001/description/face-detection-adas-binary-0001.md)                                                                 | 0.819                | 1.053      | X     |         |          |       |                |         |
+| [face-detection-retail-0004](./face-detection-retail-0004/description/face-detection-retail-0004.md)                                                                                | 1.067                | 0.588      | X     |         |          |       |                |         |
+| [face-detection-retail-0005](./face-detection-retail-0005/description/face-detection-retail-0005.md)                                                                                | 0.982                | 1.021      | X     |         |          |       |                |         |
+| [person-detection-retail-0002](./person-detection-retail-0002/description/person-detection-retail-0002.md)                                                                          | 12.427               | 3.244      |       | X       |          |       |                |         |
+| [person-detection-retail-0013](./person-detection-retail-0013/description/person-detection-retail-0013.md)                                                                          | 2.300                | 0.723      |       | X       |          |       |                |         |
+| [person-detection-action-recognition-0005](./person-detection-action-recognition-0005/description/person-detection-action-recognition-0005.md)                                      | 7.140                | 1.951      |       | X       |          |       |                |         |
+| [person-detection-action-recognition-0006](./person-detection-action-recognition-0006/description/person-detection-action-recognition-0006.md)                                      | 8.225                | 2.001      |       | X       |          |       |                |         |
+| [person-detection-action-recognition-teacher-0002](./person-detection-action-recognition-teacher-0002/description/person-detection-action-recognition-teacher-0002.md)              | 7.140                | 1.951      |       | X       |          |       |                |         |
+| [person-detection-raisinghand-recognition-0001](./person-detection-raisinghand-recognition-0001/description/person-detection-raisinghand-recognition-0001.md)                       | 7.138                | 1.951      |       | X       |          |       |                |         |
+| [pedestrian-detection-adas-0002](./pedestrian-detection-adas-0002/description/pedestrian-detection-adas-0002.md)                                                                    | 2.836                | 1.165      |       | X       |          |       |                |         |
+| [pedestrian-detection-adas-binary-0001](./pedestrian-detection-adas-binary-0001/description/pedestrian-detection-adas-binary-0001.md)                                               | 0.945                | 1.165      |       | X       |          |       |                |         |
+| [pedestrian-and-vehicle-detector-adas-0001](./pedestrian-and-vehicle-detector-adas-0001/description/pedestrian-and-vehicle-detector-adas-0001.md)                                   | 3.974                | 1.650      |       | X       | X        |       |                |         |
+| [vehicle-detection-adas-0002](./vehicle-detection-adas-0002/description/vehicle-detection-adas-0002.md)                                                                             | 2.798                | 1.079      |       |         | X        |       |                |         |
+| [vehicle-detection-adas-binary-0001](./vehicle-detection-adas-binary-0001/description/vehicle-detection-adas-binary-0001.md)                                                        | 0.942                | 1.079      |       |         | X        |       |                |         |
+| [person-vehicle-bike-detection-crossroad-0078](./person-vehicle-bike-detection-crossroad-0078/description/person-vehicle-bike-detection-crossroad-0078.md)                          | 3.964                | 1.178      |       | X       | X        | X     |                |         |
+| [person-vehicle-bike-detection-crossroad-1016](./person-vehicle-bike-detection-crossroad-1016/description/person-vehicle-bike-detection-crossroad-1016.md)                          | 3.560                | 2.887      |       | X       | X        | X     |                |         |
+| [vehicle-license-plate-detection-barrier-0106](./vehicle-license-plate-detection-barrier-0106/description/vehicle-license-plate-detection-barrier-0106.md)                          | 0.349                | 0.634      |       |         | X        |       | X              |         |
+| [product-detection-0001](./product-detection-0001/description/product-detection-0001.md)                                                                                            | 3.598                | 3.212      |       |         |          |       |                | X       |
+| [person-detection-asl-0001](./person-detection-asl-0001/description/person-detection-asl-0001.md)                                                                                   | 0.986                | 1.338      |       | X       |          |       |                |         |
+
 
 ## Object Recognition Models
 
@@ -75,11 +78,15 @@ vectors that are "close" by L2 metric (Euclidean distance).
 There are multiple models that provide various trade-offs between performance
 and accuracy (expect a bigger model to perform better).
 
-| Model Name                                                                                                                        | Complexity (GFLOPs)  | Size (Mp)  | Pairwise accuracy |
+| Model Name                                                                                                                        | Complexity (GFLOPs)  | Size (Mp)  | Rank-1 |
 |-----------------------------------------------------------------------------------------------------------------------------------|--------------------- |----------- |------------------ |
 | [person-reidentification-retail-0031](./person-reidentification-retail-0031/description/person-reidentification-retail-0031.md)   | 0.028                | 0.280      | 92.11%            |
-| [person-reidentification-retail-0079](./person-reidentification-retail-0079/description/person-reidentification-retail-0079.md)   | 0.124                | 0.820      | 92.93%            |
-| [person-reidentification-retail-0076](./person-reidentification-retail-0076/description/person-reidentification-retail-0076.md)   | 0.594                | 0.820      | 93.35%            |
+| [person-reidentification-retail-0103](./person-reidentification-retail-0103/description/person-reidentification-retail-0103.md)   | 0.564                | 0.597      | 93.5%             |
+| [person-reidentification-retail-0107](./person-reidentification-retail-0107/description/person-reidentification-retail-0107.md)   | 0.174                | 0.183      | 91.7%             |
+| [person-reidentification-retail-0200](./person-reidentification-retail-0200/description/person-reidentification-retail-0200.md)   | 5.506                | 4.723      | 95.4%             |
+
+| Model Name                                                                                                                        | Complexity (GFLOPs)  | Size (Mp)  | Pairwise accuracy |
+|-----------------------------------------------------------------------------------------------------------------------------------|--------------------- |----------- |------------------ |
 | [face-reidentification-retail-0095](./face-reidentification-retail-0095/description/face-reidentification-retail-0095.md)         | 0.588                | 1.107      | 99.33%            |
 
 
@@ -96,7 +103,7 @@ detect areas with complex shape (for example, free space on the road).
 |------------------------------------------------------------------------------------------------------------------------------------------------|--------------------- |----------- |
 | [road-segmentation-adas-0001](./road-segmentation-adas-0001/description/road-segmentation-adas-0001.md)                                        | 4.770                | 0.184      |
 | [semantic-segmentation-adas-0001](./semantic-segmentation-adas-0001/description/semantic-segmentation-adas-0001.md)                            | 58.572               | 6.686      |
-
+| [unet-camvid-onnx-0001](./unet-camvid-onnx-0001/description/unet-camvid-onnx-0001.md)                                                          | 260.1                | 31.03      |
 
 ## Instance Segmentation Models
 
@@ -155,6 +162,16 @@ Deep Learning models for text recognition in various applications.
 | [text-recognition-0012](./text-recognition-0012/description/text-recognition-0012.md)                                                          | 1.485                | 5.568      |
 | [handwritten-score-recognition-0003](./handwritten-score-recognition-0003/description/handwritten-score-recognition-0003.md)                   | 0.792                | 5.555      |
 
+## Text Spotting
+
+Deep Learning models for text spotting (simultaneous detection and recognition).
+
+| Model Name                                                                                                                                     | Complexity (GFLOPs)  | Size (Mp)  |
+|------------------------------------------------------------------------------------------------------------------------------------------------|--------------------- |----------- |
+| [text-spotting-0001-detector](./text-spotting-0001-detector/description/text-spotting-0001-detector.md)                                        | 185.169              | 26.497     |
+| [text-spotting-0001-recognizer-encoder](./text-spotting-0001-recognizer-encoder/description/text-spotting-0001-recognizer-encoder.md)          | 2.082                | 1.328      |
+| [text-spotting-0001-recognizer-decoder](./text-spotting-0001-recognizer-decoder/description/text-spotting-0001-recognizer-decoder.md)          | 0.002                | 0.273      |
+
 ## Action Recognition Models
 
 Action Recognition models predict action that is being performed on a short video clip
@@ -169,6 +186,7 @@ that predict an actual labels are called *decoder*.
 | [driver-action-recognition-adas-0002-decoder](./driver-action-recognition-adas-0002-decoder/description/driver-action-recognition-adas-0002-decoder.md) | 0.147                | 4.205      |
 | [action-recognition-0001-encoder](./action-recognition-0001-encoder/description/action-recognition-0001-encoder.md)                                     | 7.340                | 21.276     |
 | [action-recognition-0001-decoder](./action-recognition-0001-decoder/description/action-recognition-0001-decoder.md)                                     | 0.147                | 4.405      |
+| [asl-recognition-0004](./asl-recognition-0004/description/asl-recognition-0004.md)                                                                      | 6.660                | 4.133      |
 
 ## Image Retrieval
 
@@ -185,15 +203,7 @@ Deep Learning compressed models
 | Model Name                                                                                                                                     | Complexity (GFLOPs)  | Size (Mp)  |
 |------------------------------------------------------------------------------------------------------------------------------------------------|--------------------- |----------- |
 | [resnet50-binary-0001](./resnet50-binary-0001/description/resnet50-binary-0001.md)                                                             | 1.002                | 7.446      |
-| [resnet-50-int8-tf-0001](./resnet-50-int8-tf-0001/description/resnet-50-int8-tf-0001.md)                                                       | 6.996                | 25.530     |
-| [resnet-50-int8-sparse-v1-tf-0001](./resnet-50-int8-sparse-v1-tf-0001/description/resnet-50-int8-sparse-v1-tf-0001.md)                         | 6.996                | 25.530     |
-| [resnet-50-int8-sparse-v2-tf-0001](./resnet-50-int8-sparse-v2-tf-0001/description/resnet-50-int8-sparse-v2-tf-0001.md)                         | 6.996                | 25.530     |
-| [inceptionv3-int8-tf-0001](./inceptionv3-int8-tf-0001/description/inceptionv3-int8-tf-0001.md)                                                 | 11.469               | 23.819     |
-| [inceptionv3-int8-sparse-v1-tf-0001](./inceptionv3-int8-sparse-v1-tf-0001/description/inceptionv3-int8-sparse-v1-tf-0001.md)                   | 11.469               | 23.819     |
-| [inceptionv3-int8-sparse-v2-tf-0001](./inceptionv3-int8-sparse-v2-tf-0001/description/inceptionv3-int8-sparse-v2-tf-0001.md)                   | 11.469               | 23.819     |
-| [mobilenetv2-int8-tf-0001](./mobilenetv2-int8-tf-0001/description/mobilenetv2-int8-tf-0001.md)                                                 | 0.615                | 3.489      |
-| [mobilenetv2-int8-sparse-v1-tf-0001](./mobilenetv2-int8-sparse-v1-tf-0001/description/mobilenetv2-int8-sparse-v1-tf-0001.md)                   | 0.615                | 3.489      |
-| [mobilenetv2-int8-sparse-v2-tf-0001](./mobilenetv2-int8-sparse-v2-tf-0001/description/mobilenetv2-int8-sparse-v2-tf-0001.md)                   | 0.615                | 3.489      |
+| [resnet18-xnor-binary-onnx-0001](./resnet18-xnor-binary-onnx-0001/description/resnet18-xnor-binary-onnx-0001.md)                               | -                    | -          |
 
 ## Legal Information
 [*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/instance-segmentation-security-0010/model.yml b/models/intel/instance-segmentation-security-0010/model.yml
index 387edf0efc2..a565abe250f 100644
--- a/models/intel/instance-segmentation-security-0010/model.yml
+++ b/models/intel/instance-segmentation-security-0010/model.yml
@@ -13,27 +13,26 @@
 # limitations under the License.
 
 description: >-
-  This model is an instance segmentation network for 80 classes of objects.
-  It is a Mask R-CNN with ResNeXt101-32x8 backbone, PANet feature refiner with
-  GroupNorm and DeformableConv operations and Adaptive Feature Pooling in all
-  ROI-wise heads.
+  General purpose instance segmentation model. Mask-RCNN with ResNeXt101-32x8 backbone,
+  PANet feature refiner with GroupNorm and DeformableConv operations, and Adaptive
+  Feature Pooling in all ROI-wise heads.
 task_type: instance_segmentation
 files:
   - name: FP32/instance-segmentation-security-0010.xml
-    size: 260969
-    sha256: d661968e82787b907046776c44f71aa2a8ad25f4cb850baee6df02b6f42c53df
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/instance-segmentation-security-0010/FP32/instance-segmentation-security-0010.xml
+    size: 486381
+    sha256: f7acf2406403565dcd021bdab3746218462ef2afaabdea3be3a9669dac395c97
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0010/FP32/instance-segmentation-security-0010.xml
   - name: FP32/instance-segmentation-security-0010.bin
-    size: 688761824
-    sha256: 1c4d3791f5c28cdb0e716ee02bf8ff41f61d45e6d3b8692c97a6540aa2bc5437
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/instance-segmentation-security-0010/FP32/instance-segmentation-security-0010.bin
+    size: 688762056
+    sha256: 030bb05fead246de1380b79d2d07674210f0bfab101a10d4827dd10b6abfdf4b
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0010/FP32/instance-segmentation-security-0010.bin
   - name: FP16/instance-segmentation-security-0010.xml
-    size: 260759
-    sha256: 942d082768655d4bb337017b0b3a0b913df12d76c0075a3bfbfb569597fc7597
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/instance-segmentation-security-0010/FP16/instance-segmentation-security-0010.xml
+    size: 486167
+    sha256: 706e59c4d68b5d1e81338c9fd3856bb7d21e781f959dc97beca35904d8db7afa
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0010/FP16/instance-segmentation-security-0010.xml
   - name: FP16/instance-segmentation-security-0010.bin
-    size: 344381010
-    sha256: 7aeb02fbe551607be9abb32a24e57c703bf992ee89138ce1b73644b56a3c7adb
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/instance-segmentation-security-0010/FP16/instance-segmentation-security-0010.bin
+    size: 344381242
+    sha256: 8b8e17a8faeae41258f9fc3e758d987152a817c820aa82e1fd9bdbc2cf5db248
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0010/FP16/instance-segmentation-security-0010.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/instance-segmentation-security-0050/model.yml b/models/intel/instance-segmentation-security-0050/model.yml
index b4a9fb4f69b..776fcde21f0 100644
--- a/models/intel/instance-segmentation-security-0050/model.yml
+++ b/models/intel/instance-segmentation-security-0050/model.yml
@@ -13,26 +13,33 @@
 # limitations under the License.
 
 description: >-
-  This model is an instance segmentation network for 80 classes of objects.
-  It is a Mask R-CNN with ResNet50 backbone, FPN and Bottom-Up Augmentation
-  blocks and light-weight RPN.
+  General purpose instance segmentation model. Mask-RCNN with ResNet50 backbone, FPN
+  and Bottom-Up Augmentation blocks, and light-weight RPN and segmentation heads.
 task_type: instance_segmentation
 files:
   - name: FP32/instance-segmentation-security-0050.xml
-    size: 139021
-    sha256: 950b288887e299f6767b2588dd0a4fa726e5f91407f897c0a899917238852cde
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/instance-segmentation-security-0050/FP32/instance-segmentation-security-0050.xml
+    size: 270496
+    sha256: 866ce49eb932bd070e68e8cf229c38e1d378612f4f1bc835ae65af5a3715416b
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0050/FP32/instance-segmentation-security-0050.xml
   - name: FP32/instance-segmentation-security-0050.bin
-    size: 121497328
-    sha256: c923af7602592a17375e4dd7ba5b0869dc47022bd50d2558f58b1cca2ed6cfc9
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/instance-segmentation-security-0050/FP32/instance-segmentation-security-0050.bin
+    size: 121497384
+    sha256: 763f3503dc5f5fabd2021fa915783827929eb6b75555ddd95307e2226ec9325b
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0050/FP32/instance-segmentation-security-0050.bin
   - name: FP16/instance-segmentation-security-0050.xml
-    size: 138915
-    sha256: 532d5c7cfc291c25609458fdf141f25b57dc5cd1db3a2994b98ea0ca3e88ae08
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/instance-segmentation-security-0050/FP16/instance-segmentation-security-0050.xml
+    size: 270387
+    sha256: 3b23caae65f36c53155472b47a9623e0b2892de4ee4fb4b82eb1a732818d3f57
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0050/FP16/instance-segmentation-security-0050.xml
   - name: FP16/instance-segmentation-security-0050.bin
-    size: 60748674
-    sha256: 743058892ecaac32a6d789bfa177e11d335bd9b12257367b2ceed1304bf96cda
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/instance-segmentation-security-0050/FP16/instance-segmentation-security-0050.bin
+    size: 60748730
+    sha256: 07a471da43c24d183feb048cf823e87e8add9952f43ad3da97b9425b38906e4b
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0050/FP16/instance-segmentation-security-0050.bin
+  - name: FP32-INT8/instance-segmentation-security-0050.xml
+    size: 676861
+    sha256: 17ec5f1073fe347bac0cb63e599efee7ae93dfd95dd30d98bd237927a6dd23c8
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0050/FP32-INT8/instance-segmentation-security-0050.xml
+  - name: FP32-INT8/instance-segmentation-security-0050.bin
+    size: 121755968
+    sha256: f808b09716132d5670ee213a6f1d3750e3af8bfedbc8e1ed4400ba9e299dd035
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0050/FP32-INT8/instance-segmentation-security-0050.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/instance-segmentation-security-0083/model.yml b/models/intel/instance-segmentation-security-0083/model.yml
index 46e0424ec28..72df0d765ad 100644
--- a/models/intel/instance-segmentation-security-0083/model.yml
+++ b/models/intel/instance-segmentation-security-0083/model.yml
@@ -13,26 +13,33 @@
 # limitations under the License.
 
 description: >-
-  This model is an instance segmentation network for 80 classes of objects.
-  It is a Mask R-CNN model with ResNeXt152 backbone and Feature Pyramid Networks
-  block for feature maps refinement.
+  General purpose instance segmentation model. Mask-RCNN with ResNeXt152 backbone
+  and FPN block.
 task_type: instance_segmentation
 files:
   - name: FP32/instance-segmentation-security-0083.xml
-    size: 254824
-    sha256: 92a54f74e84084e35590819fcedd10ae77cbde3614cc25f0774b65ce7e6f89a2
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/instance-segmentation-security-0083/FP32/instance-segmentation-security-0083.xml
+    size: 512555
+    sha256: 81e9d91b096b0fed5613f02a397e3fb6e0b7605cdaff0ab9c4e24431c9b07bca
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0083/FP32/instance-segmentation-security-0083.xml
   - name: FP32/instance-segmentation-security-0083.bin
-    size: 564274416
-    sha256: 3226bf893e9877749c723532164952416dab5b812e825ad533c44285207a2f23
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/instance-segmentation-security-0083/FP32/instance-segmentation-security-0083.bin
+    size: 564274472
+    sha256: 1305d27772c2fc16d84f78e3c6609eb065e106656403d1f0765270b334e7f1db
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0083/FP32/instance-segmentation-security-0083.bin
   - name: FP16/instance-segmentation-security-0083.xml
-    size: 254620
-    sha256: f8dfc935757cae047b665719402921dfb3b2ad9ccab1b1059492a09df189c3d0
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/instance-segmentation-security-0083/FP16/instance-segmentation-security-0083.xml
+    size: 512347
+    sha256: 7371458aa674aff7e7f9ad0cb96a40b35b721576a0e3aec85b36b4fc1e8789ce
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0083/FP16/instance-segmentation-security-0083.xml
   - name: FP16/instance-segmentation-security-0083.bin
-    size: 282137218
-    sha256: 885f156f0947d873024dcdce51b1c5e59b60dd34d26b5bcc98da39b2267cca8b
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/instance-segmentation-security-0083/FP16/instance-segmentation-security-0083.bin
+    size: 282137274
+    sha256: ae7bf1b3f18d3333df32bb9c5a09cbe7738396d6473fdd050508d4f38356c64f
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0083/FP16/instance-segmentation-security-0083.bin
+  - name: FP32-INT8/instance-segmentation-security-0083.xml
+    size: 1392902
+    sha256: ce4df508b7a9a2102e983f73ffb2e5750c8b76c197b9af668669183251c06de9
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0083/FP32-INT8/instance-segmentation-security-0083.xml
+  - name: FP32-INT8/instance-segmentation-security-0083.bin
+    size: 565514024
+    sha256: 62f1b57b33e4386c44ddda8ab03d2cca30e30887ca354a2a3fd13dd157ff3f4d
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/instance-segmentation-security-0083/FP32-INT8/instance-segmentation-security-0083.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/landmarks-regression-retail-0009/model.yml b/models/intel/landmarks-regression-retail-0009/model.yml
index 735cf02acd5..27bdbb2cae6 100644
--- a/models/intel/landmarks-regression-retail-0009/model.yml
+++ b/models/intel/landmarks-regression-retail-0009/model.yml
@@ -13,28 +13,33 @@
 # limitations under the License.
 
 description: >-
-  This is a lightweight landmarks regressor for the Smart Classroom scenario.
-  It has a classic convolutional design: stacked 3x3 convolutions, batch normalizations,
-  PReLU activations, and poolings. Final regression is done by the global depthwise
-  pooling head and FullyConnected layers. The model predicts five facial landmarks:
-  two eyes, nose, and two lip corners.
+  Facial landmarks detection. Used in the Smart Classroom scenario. The model is identical
+  to 0002 but trained on an internal dataset with an improved regression loss.
 task_type: object_attributes
 files:
   - name: FP32/landmarks-regression-retail-0009.xml
-    size: 18089
-    sha256: c9890b8db9025e17998db19dd0e037082f0e50838cb704ea8a60c6b5ad876602
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/landmarks-regression-retail-0009/FP32/landmarks-regression-retail-0009.xml
+    size: 42715
+    sha256: ef7aa8f3f2b9730df8612fc7221bd7beb423b6001202a452723efd86993358a3
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/landmarks-regression-retail-0009/FP32/landmarks-regression-retail-0009.xml
   - name: FP32/landmarks-regression-retail-0009.bin
     size: 762464
     sha256: 46795837d35e8199b7c5b57e1f76297827bf516a150c0d5643197d8c325f1dbc
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/landmarks-regression-retail-0009/FP32/landmarks-regression-retail-0009.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/landmarks-regression-retail-0009/FP32/landmarks-regression-retail-0009.bin
   - name: FP16/landmarks-regression-retail-0009.xml
-    size: 18074
-    sha256: 5bbd3da653942f7b9131f90f456f93fa79aa4825cbc24da19eeda954e37f082b
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/landmarks-regression-retail-0009/FP16/landmarks-regression-retail-0009.xml
+    size: 42692
+    sha256: 01a0c7b4bbb0a12919351d78d551bbbe36a1fa62812c0f6ee1f49d7cc7bc10c0
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/landmarks-regression-retail-0009/FP16/landmarks-regression-retail-0009.xml
   - name: FP16/landmarks-regression-retail-0009.bin
-    size: 381232
-    sha256: 5d74c26cbb836b3de358ab05d4cbd92c4eb713dc74484cff9de82b2deb3d8527
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/landmarks-regression-retail-0009/FP16/landmarks-regression-retail-0009.bin
+    size: 381248
+    sha256: 973b13e64b3576f754a690266b069438b531bc657233d09d7b382ca36e6cf1e4
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/landmarks-regression-retail-0009/FP16/landmarks-regression-retail-0009.bin
+  - name: FP32-INT8/landmarks-regression-retail-0009.xml
+    size: 78229
+    sha256: 1bf202dd4ea57ebc17762ea3173e1c482c1c8efb2aeeec13fa073429bfd766a2
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/landmarks-regression-retail-0009/FP32-INT8/landmarks-regression-retail-0009.xml
+  - name: FP32-INT8/landmarks-regression-retail-0009.bin
+    size: 767188
+    sha256: 2a4bbc1f41d80e3ad2125d9297825d49379647ee2f61d982962135d1a146ecb7
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/landmarks-regression-retail-0009/FP32-INT8/landmarks-regression-retail-0009.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/license-plate-recognition-barrier-0001/model.yml b/models/intel/license-plate-recognition-barrier-0001/model.yml
index a12ef8b6983..36d813f7439 100644
--- a/models/intel/license-plate-recognition-barrier-0001/model.yml
+++ b/models/intel/license-plate-recognition-barrier-0001/model.yml
@@ -13,33 +13,32 @@
 # limitations under the License.
 
 description: >-
-  This model uses a small-footprint network trained end-to-end to recognize Chinese
-  license plates in traffic.
+  Chinese license plate recognition
 task_type: optical_character_recognition
 files:
   - name: FP32/license-plate-recognition-barrier-0001.xml
-    size: 24492
-    sha256: f94ba60846d4de4077a8a162fe23f51f3b43981fa4da3c33b568d328173bd0ec
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/license-plate-recognition-barrier-0001/FP32/license-plate-recognition-barrier-0001.xml
+    size: 48904
+    sha256: 1440ca7fe1057204c53f977a14b47b51750fd2a6b43b82f9a22720837aca7228
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/license-plate-recognition-barrier-0001/FP32/license-plate-recognition-barrier-0001.xml
   - name: FP32/license-plate-recognition-barrier-0001.bin
-    size: 4871832
-    sha256: e28f7533481c31ee768bba89c6ee0ef05a1892c9919bd4abc125335a8644291d
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/license-plate-recognition-barrier-0001/FP32/license-plate-recognition-barrier-0001.bin
+    size: 4871940
+    sha256: 3ef022a17b5f303c676c9c3a23669d09a257a54acdb894b6db295acc141cc4dd
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/license-plate-recognition-barrier-0001/FP32/license-plate-recognition-barrier-0001.bin
   - name: FP16/license-plate-recognition-barrier-0001.xml
-    size: 24474
-    sha256: 4d71aa3d8a86d1f6d772b76037f59e483beac7d4443a0369b335f95e67312fa1
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/license-plate-recognition-barrier-0001/FP16/license-plate-recognition-barrier-0001.xml
+    size: 48885
+    sha256: 7af8d4457e30826bf292f7b4058546cac6f498afa46cf1ae64b923b93f0dc739
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/license-plate-recognition-barrier-0001/FP16/license-plate-recognition-barrier-0001.xml
   - name: FP16/license-plate-recognition-barrier-0001.bin
-    size: 2435930
-    sha256: cdead95dde2f27f85a192360343998ca6f0fac160a1aecdf7ecbda06eafc883f
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/license-plate-recognition-barrier-0001/FP16/license-plate-recognition-barrier-0001.bin
-  - name: INT8/license-plate-recognition-barrier-0001.xml
-    size: 111802
-    sha256: 68093362cb0d3b62df410c1e9e6ecbada267d11669e19c7f3bcc450831b9fdac
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/license-plate-recognition-barrier-0001/INT8/license-plate-recognition-barrier-0001.xml
-  - name: INT8/license-plate-recognition-barrier-0001.bin
-    size: 4871832
-    sha256: bb27ed7f1d5afaf085c0eae990fe4bd491f40198e73144b2be2153bc7ac5b65f
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/license-plate-recognition-barrier-0001/INT8/license-plate-recognition-barrier-0001.bin
+    size: 2436038
+    sha256: 184d9312c71b660639898edb46b85a99477e8d6a756b2b611e71a3afad5f25c1
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/license-plate-recognition-barrier-0001/FP16/license-plate-recognition-barrier-0001.bin
+  - name: FP32-INT8/license-plate-recognition-barrier-0001.xml
+    size: 105464
+    sha256: 77a4a1eed9f54439cbddffb5e5f0068327af530e023135b273bff8b4b43c81f9
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/license-plate-recognition-barrier-0001/FP32-INT8/license-plate-recognition-barrier-0001.xml
+  - name: FP32-INT8/license-plate-recognition-barrier-0001.bin
+    size: 4882552
+    sha256: 309f08580e1284a702c4d661ffc64cb370dfeb66622724b8dfb1e2ebee646720
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/license-plate-recognition-barrier-0001/FP32-INT8/license-plate-recognition-barrier-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/mobilenetv2-int8-sparse-v1-tf-0001/description/mobilenetv2-int8-sparse-v1-tf-0001.md b/models/intel/mobilenetv2-int8-sparse-v1-tf-0001/description/mobilenetv2-int8-sparse-v1-tf-0001.md
deleted file mode 100644
index 16ff7f5205a..00000000000
--- a/models/intel/mobilenetv2-int8-sparse-v1-tf-0001/description/mobilenetv2-int8-sparse-v1-tf-0001.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# mobilenetv2-int8-sparse-v1-tf-0001
-
-## Use Case and High-Level Description
-
-This is the MobileNet v2 model that is designed to perform image classification. The model has been pretrained on the ImageNet image database and then pruned to **30.8%** of sparsity and quantized to INT8 fixed-point precision using so-called Quantization-aware training approach implemented in TensorFlow framework. The sparsity is represented by zeros inside the weights of Convolutional and Fully-conneted layers. For details about the original floating point model, check out the [paper](https://arxiv.org/pdf/1801.04381.pdf).
-
-The model input is a blob that consists of a single image of "1x224x224x3" in BGR order.
-
-The model output for `mobilenetv2-int8-sparse-v1-tf-0001` is the usual object classifier output for the 1001 different classifications matching those in the ImageNet database (the first item represents the background).
-
-## Example
-
-## Specification
-
-| Metric            | Value         |
-|-------------------|---------------|
-| Type              | Classification|
-| GFLOPs            | 0.615         |
-| MParams           | 3.489         |
-| Source framework  | TensorFlow    |
-
-## Accuracy
-
-The quality metrics calculated on ImageNet validation dataset is 71.42% accuracy top-1.
-
-| Metric                    | Value         |
-|---------------------------|---------------|
-| Accuracy top-1 (ImageNet) |        71.42% |
-
-## Performance
-
-## Input
-
-Image, shape - `1,224,224,3`, format is `B,H,W,C` where:
-
-- `B` - batch size
-- `H` - height
-- `W` - width
-- `C` - channel
-
-Channel order is `BGR`
-
-## Output
-
-Object classifier according to ImageNet classes, shape -`1,1001`, output data format is `B,C` where:
-
-- `B` - batch size
-- `C` - predicted probabilities for each class in  [0, 1] range
-
diff --git a/models/intel/mobilenetv2-int8-sparse-v1-tf-0001/model.yml b/models/intel/mobilenetv2-int8-sparse-v1-tf-0001/model.yml
deleted file mode 100644
index aa5ce66bd86..00000000000
--- a/models/intel/mobilenetv2-int8-sparse-v1-tf-0001/model.yml
+++ /dev/null
@@ -1,37 +0,0 @@
-# Copyright (c) 2019 Intel Corporation
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-description: >-
-  Mobilenet v2 INT8 quantized and pruned to 30.8% weights sparsity rate in TensorFlow.
-  Acc@top-1 on ImageNet is 71.42.
-task_type: classification
-files:
-  - name: FP32/mobilenetv2-int8-sparse-v1-tf-0001.xml
-    size: 592370
-    sha256: ad805ce1d29933a37ed51ac34251ed4bf415384f1089bfeb80cfd0945b4b5013
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/mobilenetv2-int8-sparse-v1-tf-0001/FP32/mobilenetv2-int8-sparse-v1-tf-0001.xml
-  - name: FP32/mobilenetv2-int8-sparse-v1-tf-0001.bin
-    size: 13956420
-    sha256: 3f6013acbaf5787ebf048bfc9a8c229b5df937c885ac695bd240bb2642681b11
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/mobilenetv2-int8-sparse-v1-tf-0001/FP32/mobilenetv2-int8-sparse-v1-tf-0001.bin
-  - name: FP16/mobilenetv2-int8-sparse-v1-tf-0001.xml
-    size: 592309
-    sha256: 0effe16a9d2197c041802650616507cba0e90c29e982cbb36f6754a3ad2d2be5
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/mobilenetv2-int8-sparse-v1-tf-0001/FP16/mobilenetv2-int8-sparse-v1-tf-0001.xml
-  - name: FP16/mobilenetv2-int8-sparse-v1-tf-0001.bin
-    size: 6978214
-    sha256: d06403010737b45a174aff161b8e3c60d56058ac55dcb827acbd0acc74d6e253
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/mobilenetv2-int8-sparse-v1-tf-0001/FP16/mobilenetv2-int8-sparse-v1-tf-0001.bin
-framework: dldt
-license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/mobilenetv2-int8-sparse-v2-tf-0001/description/mobilenetv2-int8-sparse-v2-tf-0001.md b/models/intel/mobilenetv2-int8-sparse-v2-tf-0001/description/mobilenetv2-int8-sparse-v2-tf-0001.md
deleted file mode 100644
index e47abb12d71..00000000000
--- a/models/intel/mobilenetv2-int8-sparse-v2-tf-0001/description/mobilenetv2-int8-sparse-v2-tf-0001.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# mobilenetv2-int8-sparse-v2-tf-0001
-
-## Use Case and High-Level Description
-
-This is the MobileNet v2 model that is designed to perform image classification. The model has been pretrained on the ImageNet image database and then pruned to **59.3%** of sparsity and quantized to INT8 fixed-point precision using so-called Quantization-aware training approach implemented in TensorFlow framework. The sparsity is represented by zeros inside the weights of Convolutional and Fully-conneted layers. For details about the original floating point model, check out the [paper](https://arxiv.org/pdf/1801.04381.pdf).
-
-The model input is a blob that consists of a single image of "1x224x224x3" in BGR order.
-
-The model output for `mobilenetv2-int8-sparse-v2-tf-0001` is the usual object classifier output for the 1001 different classifications matching those in the ImageNet database (the first item represents the background).
-
-## Example
-
-## Specification
-
-| Metric            | Value         |
-|-------------------|---------------|
-| Type              | Classification|
-| GFLOPs            | 0.615         |
-| MParams           | 3.489         |
-| Source framework  | TensorFlow    |
-
-## Accuracy
-
-The quality metrics calculated on ImageNet validation dataset is 70.85% accuracy top-1.
-
-| Metric                    | Value         |
-|---------------------------|---------------|
-| Accuracy top-1 (ImageNet) |        70.85% |
-
-## Performance
-
-## Input
-
-Image, shape - `1,224,224,3`, format is `B,H,W,C` where:
-
-- `B` - batch size
-- `H` - height
-- `W` - width
-- `C` - channel
-
-Channel order is `BGR`
-
-## Output
-
-Object classifier according to ImageNet classes, shape -`1,1001`, output data format is `B,C` where:
-
-- `B` - batch size
-- `C` - predicted probabilities for each class in  [0, 1] range
-
diff --git a/models/intel/mobilenetv2-int8-sparse-v2-tf-0001/model.yml b/models/intel/mobilenetv2-int8-sparse-v2-tf-0001/model.yml
deleted file mode 100644
index 9270856589f..00000000000
--- a/models/intel/mobilenetv2-int8-sparse-v2-tf-0001/model.yml
+++ /dev/null
@@ -1,37 +0,0 @@
-# Copyright (c) 2019 Intel Corporation
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-description: >-
-  Mobilenet v2 INT8 quantized and pruned to 53.01% weights sparsity rate in TensorFlow.
-  Acc@top-1 on ImageNet is 70.856.
-task_type: classification
-files:
-  - name: FP32/mobilenetv2-int8-sparse-v2-tf-0001.xml
-    size: 592355
-    sha256: 1217995dd07bf053492ccd2a79f6154475fb12d8c5ea6ffe6fa4c4b1f6c07c46
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/mobilenetv2-int8-sparse-v2-tf-0001/FP32/mobilenetv2-int8-sparse-v2-tf-0001.xml
-  - name: FP32/mobilenetv2-int8-sparse-v2-tf-0001.bin
-    size: 13956420
-    sha256: 91da07cc56585c55d0906d23f0b549abb737ea07dac3fc0b37b1f3dc761c03e2
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/mobilenetv2-int8-sparse-v2-tf-0001/FP32/mobilenetv2-int8-sparse-v2-tf-0001.bin
-  - name: FP16/mobilenetv2-int8-sparse-v2-tf-0001.xml
-    size: 592294
-    sha256: 6ff8be98e1afaa5261b281a713142cc1b68401d4a0bb00c1773cd85294bc64b8
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/mobilenetv2-int8-sparse-v2-tf-0001/FP16/mobilenetv2-int8-sparse-v2-tf-0001.xml
-  - name: FP16/mobilenetv2-int8-sparse-v2-tf-0001.bin
-    size: 6978214
-    sha256: 8315739354de5a429f806dc507d2e9f66256fe6e533fcfddcc2f3f6ac82c4992
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/mobilenetv2-int8-sparse-v2-tf-0001/FP16/mobilenetv2-int8-sparse-v2-tf-0001.bin
-framework: dldt
-license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/mobilenetv2-int8-tf-0001/description/mobilenetv2-int8-tf-0001.md b/models/intel/mobilenetv2-int8-tf-0001/description/mobilenetv2-int8-tf-0001.md
deleted file mode 100644
index ee211b88079..00000000000
--- a/models/intel/mobilenetv2-int8-tf-0001/description/mobilenetv2-int8-tf-0001.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# mobilenetv2-int8-tf-0001
-
-## Use Case and High-Level Description
-
-This is the MobileNet v2 model that is designed to perform image classification. The model has been pretrained on the ImageNet image database and then quantized to INT8 fixed-point precision using so-called Quantization-aware training approach implemented in TensorFlow framework. For details about the original floating point model, check out the [paper](https://arxiv.org/pdf/1801.04381.pdf).
-
-The model input is a blob that consists of a single image of "1x224x224x3" in BGR order.
-
-The model output for `mobilenetv2-int8-tf-0001` is the usual object classifier output for the 1001 different classifications matching those in the ImageNet database (the first item represents the background).
-
-## Example
-
-## Specification
-
-| Metric            | Value         |
-|-------------------|---------------|
-| Type              | Classification|
-| GFLOPs            | 0.615         |
-| MParams           | 3.489         |
-| Source framework  | TensorFlow    |
-
-## Accuracy
-
-The quality metrics calculated on ImageNet validation dataset is 70.8% accuracy top-1.
-
-| Metric                    | Value         |
-|---------------------------|---------------|
-| Accuracy top-1 (ImageNet) |         70.8% |
-
-## Performance
-
-## Input
-
-Image, shape - `1,224,224,3`, format is `B,H,W,C` where:
-
-- `B` - batch size
-- `H` - height
-- `W` - width
-- `C` - channel
-
-Channel order is `BGR`
-
-## Output
-
-Object classifier according to ImageNet classes, shape -`1,1001`, output data format is `B,C` where:
-
-- `B` - batch size
-- `C` - predicted probabilities for each class in  [0, 1] range
-
diff --git a/models/intel/mobilenetv2-int8-tf-0001/model.yml b/models/intel/mobilenetv2-int8-tf-0001/model.yml
deleted file mode 100644
index 86cb8fcb86e..00000000000
--- a/models/intel/mobilenetv2-int8-tf-0001/model.yml
+++ /dev/null
@@ -1,36 +0,0 @@
-# Copyright (c) 2019 Intel Corporation
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-description: >-
-  MobileNet v2 INT8 quantized in TensorFlow. Acc@Top-1 on ImageNet is 70.8.
-task_type: classification
-files:
-  - name: FP32/mobilenetv2-int8-tf-0001.xml
-    size: 593762
-    sha256: 310abe6133d9a243c21e83718b0f3c38b6657f010bb974ecb2ab56a2dabdeffd
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/mobilenetv2-int8-tf-0001/FP32/mobilenetv2-int8-tf-0001.xml
-  - name: FP32/mobilenetv2-int8-tf-0001.bin
-    size: 13956428
-    sha256: 2e185fdad4286a1dca30b746e967e742cc70faf1f8f77f181c27792e8b39e668
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/mobilenetv2-int8-tf-0001/FP32/mobilenetv2-int8-tf-0001.bin
-  - name: FP16/mobilenetv2-int8-tf-0001.xml
-    size: 593700
-    sha256: b32e04d238fc7124e6e3762ebe48057f011113a3f624cb40a1b071a370f345d1
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/mobilenetv2-int8-tf-0001/FP16/mobilenetv2-int8-tf-0001.xml
-  - name: FP16/mobilenetv2-int8-tf-0001.bin
-    size: 6978222
-    sha256: 0018413ca306188f334e54e00fea4599cb916c6c5de2999151894b1b18c54c0b
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/mobilenetv2-int8-tf-0001/FP16/mobilenetv2-int8-tf-0001.bin
-framework: dldt
-license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/pedestrian-and-vehicle-detector-adas-0001/description/pedestrian-and-vehicle-detector-adas-0001.md b/models/intel/pedestrian-and-vehicle-detector-adas-0001/description/pedestrian-and-vehicle-detector-adas-0001.md
index c1a5a6224e6..954aef3b830 100644
--- a/models/intel/pedestrian-and-vehicle-detector-adas-0001/description/pedestrian-and-vehicle-detector-adas-0001.md
+++ b/models/intel/pedestrian-and-vehicle-detector-adas-0001/description/pedestrian-and-vehicle-detector-adas-0001.md
@@ -21,7 +21,7 @@ Pedestrian and vehicle detection network based on MobileNet v1.0 + SSD.
 | Source framework                | Caffe*                |
 
 Average Precision (AP) metric is described in: Mark Everingham et al.
-[“The PASCAL Visual Object Classes (VOC) Challenge”](http://host.robots.ox.ac.uk/pascal/VOC/pubs/everingham10.pdf).
+[The PASCAL Visual Object Classes (VOC) Challenge](http://host.robots.ox.ac.uk/pascal/VOC/pubs/everingham10.pdf).
 
 Tested on challenging internal datasets with 1001 pedestrian and 12585 vehicles to detect.
 
diff --git a/models/intel/pedestrian-and-vehicle-detector-adas-0001/model.yml b/models/intel/pedestrian-and-vehicle-detector-adas-0001/model.yml
index b3f5bbd3d94..2edb1f0294e 100644
--- a/models/intel/pedestrian-and-vehicle-detector-adas-0001/model.yml
+++ b/models/intel/pedestrian-and-vehicle-detector-adas-0001/model.yml
@@ -13,32 +13,32 @@
 # limitations under the License.
 
 description: >-
-  Pedestrian and vehicle detection network based on MobileNet v1.0 + SSD.
+  Pedestrian and vehicle detector based on SSD + MobileNet with a reduced number of channels.
 task_type: detection
 files:
   - name: FP32/pedestrian-and-vehicle-detector-adas-0001.xml
-    size: 88919
-    sha256: 8b32631050b6d21b290e221dcad7cb3203f4b026dab34896d1924c3f6f3976c3
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-and-vehicle-detector-adas-0001/FP32/pedestrian-and-vehicle-detector-adas-0001.xml
+    size: 245537
+    sha256: 3fd1c0f8b4a5867c9c7e6fd1be0ec8c71f1f905fb874b529c419980bb436c60a
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-and-vehicle-detector-adas-0001/FP32/pedestrian-and-vehicle-detector-adas-0001.xml
   - name: FP32/pedestrian-and-vehicle-detector-adas-0001.bin
-    size: 6598484
-    sha256: 7ce62bc9708c2407b60269c968b5b0a3167aec47c4070e87634657134aa1aaf8
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-and-vehicle-detector-adas-0001/FP32/pedestrian-and-vehicle-detector-adas-0001.bin
+    size: 6598568
+    sha256: 9b8288591d18c3e3daa8bc48f9f2f14ecb1bf83032fe6439d6bc7b43f9f1a4e9
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-and-vehicle-detector-adas-0001/FP32/pedestrian-and-vehicle-detector-adas-0001.bin
   - name: FP16/pedestrian-and-vehicle-detector-adas-0001.xml
-    size: 88872
-    sha256: c73e350277d5e69513fbd3d97f34f376851fd900db27335af0fc7b144bda361d
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml
+    size: 245487
+    sha256: 6f24dfc89e0656a544c9a2cd040ca592fbda649328885193aa5eaa57d20d1d6f
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml
   - name: FP16/pedestrian-and-vehicle-detector-adas-0001.bin
-    size: 3299248
-    sha256: d5b2a74485313299515400f0de6b116a6cb5c776098a1f36bddf942f6fba2087
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.bin
-  - name: INT8/pedestrian-and-vehicle-detector-adas-0001.xml
-    size: 4796350
-    sha256: 0c06f8a4da402c419df43616bc44841fb5987f38c2e2a0d1d72caa5c4d76b678
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-and-vehicle-detector-adas-0001/INT8/pedestrian-and-vehicle-detector-adas-0001.xml
-  - name: INT8/pedestrian-and-vehicle-detector-adas-0001.bin
-    size: 6598484
-    sha256: 6d3da94b2f4cb6a63fb23ed34409d5c706877584c251e4610d6854f2d480d72c
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-and-vehicle-detector-adas-0001/INT8/pedestrian-and-vehicle-detector-adas-0001.bin
+    size: 3299336
+    sha256: 3f9739b91277bc916f29b17d043115c6669e113e5d60d61589063d8054c40d7d
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.bin
+  - name: FP32-INT8/pedestrian-and-vehicle-detector-adas-0001.xml
+    size: 478288
+    sha256: 9f7c745d9f808018f02d435bb56a9eeadc26789fc37396032c215b97491a6e43
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-and-vehicle-detector-adas-0001/FP32-INT8/pedestrian-and-vehicle-detector-adas-0001.xml
+  - name: FP32-INT8/pedestrian-and-vehicle-detector-adas-0001.bin
+    size: 6693280
+    sha256: 6157784eebd2a2e08bc5b0076f8d11868fbc096a0e60f5e34d72c8dd3ed32bb5
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-and-vehicle-detector-adas-0001/FP32-INT8/pedestrian-and-vehicle-detector-adas-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/pedestrian-detection-adas-0002/description/pedestrian-detection-adas-0002.md b/models/intel/pedestrian-detection-adas-0002/description/pedestrian-detection-adas-0002.md
index 5c4f4e9a619..fd4f4806af2 100644
--- a/models/intel/pedestrian-detection-adas-0002/description/pedestrian-detection-adas-0002.md
+++ b/models/intel/pedestrian-detection-adas-0002/description/pedestrian-detection-adas-0002.md
@@ -20,7 +20,7 @@ Pedestrian detection network based on SSD framework with tuned MobileNet v1 as a
 | Source framework                | Caffe*                                    |
 
 Average Precision metric described in: Mark Everingham et al.
-[“The PASCAL Visual Object Classes (VOC) Challenge”](http://host.robots.ox.ac.uk/pascal/VOC/pubs/everingham10.pdf).
+[The PASCAL Visual Object Classes (VOC) Challenge](http://host.robots.ox.ac.uk/pascal/VOC/pubs/everingham10.pdf).
 
 Tested on an internal dataset with 1001 pedestrian to detect.
 
diff --git a/models/intel/pedestrian-detection-adas-0002/model.yml b/models/intel/pedestrian-detection-adas-0002/model.yml
index 47c231b68c1..9c2e2bbe686 100644
--- a/models/intel/pedestrian-detection-adas-0002/model.yml
+++ b/models/intel/pedestrian-detection-adas-0002/model.yml
@@ -13,33 +13,32 @@
 # limitations under the License.
 
 description: >-
-  Pedestrian detection network based on SSD framework with tuned MobileNet v1
-  as a feature extractor.
+  Pedestrian detector based on SSD + MobileNet with a reduced number of channels.
 task_type: detection
 files:
   - name: FP32/pedestrian-detection-adas-0002.xml
-    size: 88868
-    sha256: 157058618cbe339a9093077704a12758c6d65e019bf890e404d67a97470352c4
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-detection-adas-0002/FP32/pedestrian-detection-adas-0002.xml
+    size: 245421
+    sha256: 69dc36c52afc27f2ffa752e28e1710ca7653b3b7abda6e25c1fde7eb0767b480
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-detection-adas-0002/FP32/pedestrian-detection-adas-0002.xml
   - name: FP32/pedestrian-detection-adas-0002.bin
-    size: 4660164
-    sha256: d4b8cad14ad4e85cb88aca6ab3f55be4214c0fd04cd036b631f9b365eb287377
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-detection-adas-0002/FP32/pedestrian-detection-adas-0002.bin
+    size: 4660248
+    sha256: de3e3b12eb631d0fa67db14d7cd3c3aaea7edc78e460485dcdae3a447f4d4288
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-detection-adas-0002/FP32/pedestrian-detection-adas-0002.bin
   - name: FP16/pedestrian-detection-adas-0002.xml
-    size: 88818
-    sha256: e0e04bc21e695fb45a0d55667ed0f179c8a1adc53fc3f75b1155dc1588a9ae65
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-detection-adas-0002/FP16/pedestrian-detection-adas-0002.xml
+    size: 245369
+    sha256: 233519498b393adc8506bd80dd09d19f89e202b544565e7821a7fdff48bfa306
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-detection-adas-0002/FP16/pedestrian-detection-adas-0002.xml
   - name: FP16/pedestrian-detection-adas-0002.bin
-    size: 2330088
-    sha256: 6f5c036879005f87e2ddaf09d7c48988fc142e6c72182b2abc3d09b275f4597d
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-detection-adas-0002/FP16/pedestrian-detection-adas-0002.bin
-  - name: INT8/pedestrian-detection-adas-0002.xml
-    size: 3952495
-    sha256: 6585f16fa7401b8eccd839ecca85b8acabab3f01793d85c31daa19401dac9b98
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-detection-adas-0002/INT8/pedestrian-detection-adas-0002.xml
-  - name: INT8/pedestrian-detection-adas-0002.bin
-    size: 4660164
-    sha256: 929d7dba718a5e51745a0d6f331fc96013573ced80c72ff4b5125c32e51c4ce6
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-detection-adas-0002/INT8/pedestrian-detection-adas-0002.bin
+    size: 2330176
+    sha256: 693753b7466da913b537016b31e3012f8ce6a885ac0897e3986eeca66d4ef8e6
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-detection-adas-0002/FP16/pedestrian-detection-adas-0002.bin
+  - name: FP32-INT8/pedestrian-detection-adas-0002.xml
+    size: 478047
+    sha256: d04b25d198b5a007d5301fa60d2b67634beaa30886b11c03ddc76df8506aed9a
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-detection-adas-0002/FP32-INT8/pedestrian-detection-adas-0002.xml
+  - name: FP32-INT8/pedestrian-detection-adas-0002.bin
+    size: 4740408
+    sha256: 38c3e849bd872a604a1374dffdb18520718c3c2d16fe13ce07642a986f68a273
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-detection-adas-0002/FP32-INT8/pedestrian-detection-adas-0002.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/pedestrian-detection-adas-binary-0001/description/pedestrian-detection-adas-binary-0001.md b/models/intel/pedestrian-detection-adas-binary-0001/description/pedestrian-detection-adas-binary-0001.md
index 8beb618a4ab..571511a3f17 100644
--- a/models/intel/pedestrian-detection-adas-binary-0001/description/pedestrian-detection-adas-binary-0001.md
+++ b/models/intel/pedestrian-detection-adas-binary-0001/description/pedestrian-detection-adas-binary-0001.md
@@ -19,10 +19,10 @@ Some layers of MobileNet v1 are binary and use I1 arithm
 | GFlops                          | 0.750                                     |
 | GI1ops                          | 2.086                                     |
 | MParams                         | 1.165                                     |
-| Source framework                | Pytorch*                                  |
+| Source framework                | PyTorch*                                  |
 
 Average Precision metric described in: Mark Everingham et al.
-[“The PASCAL Visual Object Classes (VOC) Challenge”](http://host.robots.ox.ac.uk/pascal/VOC/pubs/everingham10.pdf).
+[The PASCAL Visual Object Classes (VOC) Challenge](http://host.robots.ox.ac.uk/pascal/VOC/pubs/everingham10.pdf).
 
 Tested on an internal dataset with 1001 pedestrian to detect.
 
diff --git a/models/intel/pedestrian-detection-adas-binary-0001/model.yml b/models/intel/pedestrian-detection-adas-binary-0001/model.yml
index 5f992ddd293..f0c3b082a25 100644
--- a/models/intel/pedestrian-detection-adas-binary-0001/model.yml
+++ b/models/intel/pedestrian-detection-adas-binary-0001/model.yml
@@ -13,17 +13,17 @@
 # limitations under the License.
 
 description: >-
-  Pedestrian detection network based on SSD framework with tuned MobileNet v1
-  as a feature extractor. Some layers of MobileNet v1 are binary and use I1 arithm
+  Pedestrian detector based on SSD + MobileNet with a reduced number of channels
+  and binary layers.
 task_type: detection
 files:
-  - name: INT1/pedestrian-detection-adas-binary-0001.xml
+  - name: FP32-INT1/pedestrian-detection-adas-binary-0001.xml
     size: 114635
     sha256: e64e7ce32c87e1c698b50abb8f2cf1d96c7651d45fc20bac09c417e046afa7f4
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-detection-adas-binary-0001/INT1/pedestrian-detection-adas-binary-0001.xml
-  - name: INT1/pedestrian-detection-adas-binary-0001.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-detection-adas-binary-0001/FP32-INT1/pedestrian-detection-adas-binary-0001.xml
+  - name: FP32-INT1/pedestrian-detection-adas-binary-0001.bin
     size: 2338004
     sha256: 7c2761ca3859ef55a80d9ed924225df7ba363fcb151e4ec2f7d1061b70bdb374
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/pedestrian-detection-adas-binary-0001/INT1/pedestrian-detection-adas-binary-0001.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/pedestrian-detection-adas-binary-0001/FP32-INT1/pedestrian-detection-adas-binary-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-attributes-recognition-crossroad-0230/description/person-attributes-recognition-crossroad-0230.md b/models/intel/person-attributes-recognition-crossroad-0230/description/person-attributes-recognition-crossroad-0230.md
index 77ae428e87e..015f04bc541 100644
--- a/models/intel/person-attributes-recognition-crossroad-0230/description/person-attributes-recognition-crossroad-0230.md
+++ b/models/intel/person-attributes-recognition-crossroad-0230/description/person-attributes-recognition-crossroad-0230.md
@@ -1,7 +1,7 @@
 # person-attributes-recognition-crossroad-0230
 
 ## Use Case and High-Level Description
-This model presents a person attributes classification algorithm analysis scenario. It produces probability of person attributions existing on the sample and a position of two point on sample, whiches can be used for color prob (like, color picker in graphical editors)
+This model presents a person attributes classification algorithm analysis scenario. It produces the probability of each person attribute being present in the sample and the positions of two points on the sample, which can be used for color probing (like a color picker in graphical editors).
 
 ## Examples
 
@@ -21,7 +21,7 @@ This model presents a person attributes classification algorithm analysis scenar
 | Supported attributes  | is_male, has_bag, has_backpack, has hat, has longsleeves, has longpants, has longhair, has coat_jacket|
 | GFlops                | 0.174                                                                                                |
 | MParams               | 0.735                                                                                                |
-| Source framework      | Pytorch*                                                                                             |
+| Source framework      | PyTorch*                                                                                             |
 
 
 ## Accuracy
diff --git a/models/intel/person-attributes-recognition-crossroad-0230/model.yml b/models/intel/person-attributes-recognition-crossroad-0230/model.yml
index b721de655f2..c2c88067c2f 100644
--- a/models/intel/person-attributes-recognition-crossroad-0230/model.yml
+++ b/models/intel/person-attributes-recognition-crossroad-0230/model.yml
@@ -13,27 +13,25 @@
 # limitations under the License.
 
 description: >-
-  This model presents a person attributes classification algorithm analysis scenario.
-  It produces probability of person attributions existing on the sample and a
-  position of two point on sample, whiches can be used for color prob (like, color
-  picker in graphical editors)
+  Pedestrian attributes recognition based on a PVANet with hyperfeatures backbone
+  + classification head
 task_type: object_attributes
 files:
   - name: FP32/person-attributes-recognition-crossroad-0230.xml
-    size: 85544
-    sha256: 99d57e3a879c5fd5174651d2dd07f294d4e7c6d0f70bce55ca99f8638d023ef0
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-attributes-recognition-crossroad-0230/FP32/person-attributes-recognition-crossroad-0230.xml
+    size: 173336
+    sha256: bd911ccf0926eb48aae0c75ba385fd4783e6ad1680b80135b274a731e99b9c67
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-attributes-recognition-crossroad-0230/FP32/person-attributes-recognition-crossroad-0230.xml
   - name: FP32/person-attributes-recognition-crossroad-0230.bin
-    size: 2939224
-    sha256: 1d1c392826e77373d87fd1d7c65ce238c615f729e5524f1dfbc07a3a6c0cf8db
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-attributes-recognition-crossroad-0230/FP32/person-attributes-recognition-crossroad-0230.bin
+    size: 2939232
+    sha256: 01432edde876a4be8c7ef87801b7c45a09a442daec06551fd2db7c81f1d76407
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-attributes-recognition-crossroad-0230/FP32/person-attributes-recognition-crossroad-0230.bin
   - name: FP16/person-attributes-recognition-crossroad-0230.xml
-    size: 85458
-    sha256: 880592676c50a472f316db4b8f1745f3d9233e9234d0791e9a615107264e8e73
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-attributes-recognition-crossroad-0230/FP16/person-attributes-recognition-crossroad-0230.xml
+    size: 173251
+    sha256: 20f6e12b608e8910bebf5e229b943fb1356d2f2a55265cda04f2a5a7d7afbb58
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-attributes-recognition-crossroad-0230/FP16/person-attributes-recognition-crossroad-0230.xml
   - name: FP16/person-attributes-recognition-crossroad-0230.bin
-    size: 1469612
-    sha256: 033c56ba8e93c03604e78b99f9b7e5ab07fa57cfd1d865cb62fc001744fc6e72
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-attributes-recognition-crossroad-0230/FP16/person-attributes-recognition-crossroad-0230.bin
+    size: 1469624
+    sha256: 61327cb5748a234c0320456e83dc8e42756c3a9856f15580a111493da47366fc
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-attributes-recognition-crossroad-0230/FP16/person-attributes-recognition-crossroad-0230.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-detection-action-recognition-0005/model.yml b/models/intel/person-detection-action-recognition-0005/model.yml
index 4234a9f11cd..c0b3dee2d27 100644
--- a/models/intel/person-detection-action-recognition-0005/model.yml
+++ b/models/intel/person-detection-action-recognition-0005/model.yml
@@ -13,37 +13,32 @@
 # limitations under the License.
 
 description: >-
-  This is an action detector for the Smart Classroom scenario. It is based on
-  the RMNet backbone that includes depth-wise convolutions to reduce the amount
-  of computations for the 3x3 convolution block. The first SSD head from 1/16
-  scale feature map has four clustered prior boxes and outputs detected persons
-  (two class detector). The second SSD-based head predicts actions of the detected
-  persons. Possible actions: sitting, standing, raising hand.
+  Second generation of action detection (SSD-based) model to use in Smart Classroom.
 task_type: detection
 files:
   - name: FP32/person-detection-action-recognition-0005.xml
-    size: 282096
-    sha256: 69b18b2cfe6105bad2cf4970c8187f6879e79d16d8947029fa0993ed16dc71a3
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-0005/FP32/person-detection-action-recognition-0005.xml
+    size: 651605
+    sha256: 7978b641bbc5fb9676ef18e35bec14d3541595b27454c95fab9ede178da0cc06
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-0005/FP32/person-detection-action-recognition-0005.xml
   - name: FP32/person-detection-action-recognition-0005.bin
-    size: 7800264
-    sha256: b68ab79b18b570569024665ec9a72e1c15568c5721d243e0e74f0423560361db
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-0005/FP32/person-detection-action-recognition-0005.bin
+    size: 7800360
+    sha256: 2982e6c2683229a450d674c362cc11abd640dce4e39e95925c7957a28011f147
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-0005/FP32/person-detection-action-recognition-0005.bin
   - name: FP16/person-detection-action-recognition-0005.xml
-    size: 281852
-    sha256: d867fdbbfc189be1704d9e35e57ad684a3986669626ddbe4ca73d628927b98c9
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-0005/FP16/person-detection-action-recognition-0005.xml
+    size: 651362
+    sha256: 1d01cf1af48403eeb8f503e10416f94461e56dec2b3a038ae3a34da0807760b7
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-0005/FP16/person-detection-action-recognition-0005.xml
   - name: FP16/person-detection-action-recognition-0005.bin
-    size: 3900138
-    sha256: 72263b506b29f7d41eadd33386d67faebea19b35cf799ae876a807d35160da8f
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-0005/FP16/person-detection-action-recognition-0005.bin
-  - name: INT8/person-detection-action-recognition-0005.xml
-    size: 2081562
-    sha256: 9098c11bb19fb8718dd3bd8242ff7287e31d47d17930c63aa99740cbf3c34222
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-0005/INT8/person-detection-action-recognition-0005.xml
-  - name: INT8/person-detection-action-recognition-0005.bin
-    size: 7804916
-    sha256: f154273ce9138d2314f68e24a2319fd1add8e9099bd3f8163e939b7d09e73df6
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-0005/INT8/person-detection-action-recognition-0005.bin
+    size: 3900234
+    sha256: 159f52fdd28bef5a3ef3edd998fe08fd4d51c4a3fb2b9134b82a09f6a252c378
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-0005/FP16/person-detection-action-recognition-0005.bin
+  - name: FP32-INT8/person-detection-action-recognition-0005.xml
+    size: 1697244
+    sha256: 0f8f73f28ab61f3a0a0ed8abb65ce341278e457647a6636d6ee7a8164b62b320
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-0005/FP32-INT8/person-detection-action-recognition-0005.xml
+  - name: FP32-INT8/person-detection-action-recognition-0005.bin
+    size: 7972512
+    sha256: cd8f809d2a6dfe12808a9a49c62fa3501c22fdff2c955961746a3c24e20d7db4
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-0005/FP32-INT8/person-detection-action-recognition-0005.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-detection-action-recognition-0006/model.yml b/models/intel/person-detection-action-recognition-0006/model.yml
index c643697943c..2516f0f8803 100644
--- a/models/intel/person-detection-action-recognition-0006/model.yml
+++ b/models/intel/person-detection-action-recognition-0006/model.yml
@@ -17,28 +17,28 @@ description: >-
 task_type: detection
 files:
   - name: FP32/person-detection-action-recognition-0006.xml
-    size: 326861
-    sha256: 2ff9c68b16c0e09ba60f4e52a594ac4e7b36e57160ca416ef2e437bde2c88882
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-0006/FP32/person-detection-action-recognition-0006.xml
+    size: 756047
+    sha256: 1ce4f689b91a2f6f7024faa25257c16ba3567e4aa437f3df3855892e1aa0336f
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-0006/FP32/person-detection-action-recognition-0006.xml
   - name: FP32/person-detection-action-recognition-0006.bin
-    size: 7458792
-    sha256: 8d643910cd1e670f1832d989b7af1d90d14c44a665fb7fd3c6c5bdcb61a36517
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-0006/FP32/person-detection-action-recognition-0006.bin
+    size: 7458352
+    sha256: 888d01b994c58baa65ab20b948439620222512ee49d45e6f443f271d7637f603
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-0006/FP32/person-detection-action-recognition-0006.bin
   - name: FP16/person-detection-action-recognition-0006.xml
-    size: 326593
-    sha256: e9a1485f3fa28a3c49adaa4c2179730da8eb25647810d23e9b94748bdd39b12e
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-0006/FP16/person-detection-action-recognition-0006.xml
+    size: 755769
+    sha256: bb994602aef093f7566c0a0a567f11b1e76180a7f6bd3e67139377e298543394
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-0006/FP16/person-detection-action-recognition-0006.xml
   - name: FP16/person-detection-action-recognition-0006.bin
-    size: 3729408
-    sha256: 1db6fef93efe3214720ce8d05ad52cd0f24c92c5c49fa72ebe6c32debb2e798f
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-0006/FP16/person-detection-action-recognition-0006.bin
-  - name: INT8/person-detection-action-recognition-0006.xml
-    size: 1512221
-    sha256: 8d007b657e8ff78ca5646fe2a765aa5f9012cf8d6b468d0c193ea4a2e45da3b1
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-0006/INT8/person-detection-action-recognition-0006.xml
-  - name: INT8/person-detection-action-recognition-0006.bin
-    size: 8004096
-    sha256: baa89392295213d85af91f271db6ca959d81df0a1352c5475f0a628621d6ce4b
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-0006/INT8/person-detection-action-recognition-0006.bin
+    size: 3729222
+    sha256: 6752e639f4035582f77209a6030cded78ec4869b628ad9cdde1907d8cfd13368
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-0006/FP16/person-detection-action-recognition-0006.bin
+  - name: FP32-INT8/person-detection-action-recognition-0006.xml
+    size: 1897659
+    sha256: 3f472adbeba1a9fd9ebaa552c9c07d32e5da32659467c5d6e4f330bfba0b5ddc
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-0006/FP32-INT8/person-detection-action-recognition-0006.xml
+  - name: FP32-INT8/person-detection-action-recognition-0006.bin
+    size: 7652264
+    sha256: 6ec864ac04c366c7bcfd77b8548b22d0d8797c4b6ad63bc759f10781aa573e7a
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-0006/FP32-INT8/person-detection-action-recognition-0006.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-detection-action-recognition-teacher-0002/model.yml b/models/intel/person-detection-action-recognition-teacher-0002/model.yml
index 73755cbabce..e7d8647c4bd 100644
--- a/models/intel/person-detection-action-recognition-teacher-0002/model.yml
+++ b/models/intel/person-detection-action-recognition-teacher-0002/model.yml
@@ -13,29 +13,33 @@
 # limitations under the License.
 
 description: >-
-  This is an action detector for the Smart Classroom scenario. It is based on
-  the RMNet backbone that includes depth-wise convolutions to reduce the amount
-  of computations for the 3x3 convolution block. The first SSD head from 1/16
-  scale feature map has four clustered prior boxes and outputs detected persons
-  (two class detector). The second SSD-based head predicts actions of the detected
-  persons. Possible actions: standing, writing, demonstrating.
+  Second generation of action detection (SSD-based) model to use in Smart Classroom
+  for classifying teacher's actions.
 task_type: detection
 files:
   - name: FP32/person-detection-action-recognition-teacher-0002.xml
-    size: 282104
-    sha256: 4034363f7e92ea1acba7e9d0bcd08286dcbbf5311041c464b26d081b73c5f54c
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-teacher-0002/FP32/person-detection-action-recognition-teacher-0002.xml
+    size: 651618
+    sha256: 0853dc3856c28ae2058a02db7522f7f5d66c49c82f60ff4b51d1377d5a322484
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-teacher-0002/FP32/person-detection-action-recognition-teacher-0002.xml
   - name: FP32/person-detection-action-recognition-teacher-0002.bin
-    size: 7800264
-    sha256: 711ab8b5737f72d6087c86c017e97d8ebc6e29795b5c63c7665f1e1c37909347
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-teacher-0002/FP32/person-detection-action-recognition-teacher-0002.bin
+    size: 7800360
+    sha256: ebe9c7cdca28a408302b3b1f241afdc670abc251bd692c13a3140c78b08b0498
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-teacher-0002/FP32/person-detection-action-recognition-teacher-0002.bin
   - name: FP16/person-detection-action-recognition-teacher-0002.xml
-    size: 281860
-    sha256: eca9d4d638e3e5786b8c9777ee66aaaa0a0d2aef66e143964cc6b78388ee32e5
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-teacher-0002/FP16/person-detection-action-recognition-teacher-0002.xml
+    size: 651375
+    sha256: 36cd0bd99542386fd15c083e8325c37f920f95173d314d9406fd3ce41ac73df7
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-teacher-0002/FP16/person-detection-action-recognition-teacher-0002.xml
   - name: FP16/person-detection-action-recognition-teacher-0002.bin
-    size: 3900138
-    sha256: 9854776b1233e7021deaeb3fc0fe245375b67bd9c5d3e1528d04286b1793e440
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-action-recognition-teacher-0002/FP16/person-detection-action-recognition-teacher-0002.bin
+    size: 3900234
+    sha256: 190e9b71ae02e022c6afe2dc9fb59939066e046234ff35f4ceab6ddfabab7883
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-teacher-0002/FP16/person-detection-action-recognition-teacher-0002.bin
+  - name: FP32-INT8/person-detection-action-recognition-teacher-0002.xml
+    size: 1697252
+    sha256: 1f363ddd0a09837c06d28b49514db1c81beafb2ba95ea40700a0b26688266d1e
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-teacher-0002/FP32-INT8/person-detection-action-recognition-teacher-0002.xml
+  - name: FP32-INT8/person-detection-action-recognition-teacher-0002.bin
+    size: 7972512
+    sha256: 9423a50cb23b265d8862108a7ab88e1536c1b342276d792af56ff3d34d70553d
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-action-recognition-teacher-0002/FP32-INT8/person-detection-action-recognition-teacher-0002.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-detection-asl-0001/description/person-detection-asl-0001.md b/models/intel/person-detection-asl-0001/description/person-detection-asl-0001.md
new file mode 100644
index 00000000000..803a33aaad5
--- /dev/null
+++ b/models/intel/person-detection-asl-0001/description/person-detection-asl-0001.md
@@ -0,0 +1,44 @@
+# person-detection-asl-0001
+
+## Use case and High-level description
+
+This is a person detector for the ASL Recognition scenario. It is based on a ShuffleNetV2-like backbone, which includes depth-wise convolutions to reduce the amount of computation for the 3x3 convolution block, and an FCOS head.
+
+## Example
+
+![](./person-detection-asl-0001.png)
+
+## Specification
+
+| Metric                          | Value                                     |
+|---------------------------------|-------------------------------------------|
+| Persons AP on MS-COCO\*         | 77.68%                                    |
+| Minimal person height           | 100 pixels                                |
+| GFlops                          | 0.986                                     |
+| MParams                         | 1.338                                     |
+| Source framework                | PyTorch\*                                 |
+
+Average Precision (AP) is defined as an area under the [precision/recall](https://en.wikipedia.org/wiki/Precision_and_recall) curve.
+
+## Performance
+
+## Inputs
+
+Name: "input", shape: [1x3x320x320] - An input image in the format [1xCxHxW], where:
+ - C - number of channels
+ - H - image height
+ - W - image width
+
+Expected color order is BGR.
+
+## Outputs
+
+The net outputs a blob with the shape [N, 5], where N is the number of detected
+bounding boxes. For each detection, the description has the format:
+[`x_min`, `y_min`, `x_max`, `y_max`, `conf`]
+ - (`x_min`, `y_min`) - coordinates of the top left bounding box corner
+ - (`x_max`, `y_max`) - coordinates of the bottom right bounding box corner
+ - `conf` - confidence for the predicted class
+
+## Legal Information
+[\*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/person-detection-asl-0001/description/person-detection-asl-0001.png b/models/intel/person-detection-asl-0001/description/person-detection-asl-0001.png
new file mode 100644
index 00000000000..de3f62ab777
Binary files /dev/null and b/models/intel/person-detection-asl-0001/description/person-detection-asl-0001.png differ
diff --git a/models/intel/person-detection-asl-0001/model.yml b/models/intel/person-detection-asl-0001/model.yml
new file mode 100644
index 00000000000..596a11ed113
--- /dev/null
+++ b/models/intel/person-detection-asl-0001/model.yml
@@ -0,0 +1,28 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  Person detector (ShuffleNetV2 backbone and FCOS head) for the ASL scenario
+task_type: detection
+files:
+  - name: FP32/person-detection-asl-0001.xml
+    size: 569024
+    sha256: 642f7ee90b171a43c6af110f00a0bf514b275beff7ddebad1837eeae6143f885
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-asl-0001/FP32/person-detection-asl-0001.xml
+  - name: FP32/person-detection-asl-0001.bin
+    size: 4026864
+    sha256: d6ee1d8204f84f0f7ed9f7567dabaabad0b9c31db8113bdb5da82bfa66afaee8
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-asl-0001/FP32/person-detection-asl-0001.bin
+framework: dldt
+license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-detection-raisinghand-recognition-0001/model.yml b/models/intel/person-detection-raisinghand-recognition-0001/model.yml
index 00612c5469f..66f691e5d9d 100644
--- a/models/intel/person-detection-raisinghand-recognition-0001/model.yml
+++ b/models/intel/person-detection-raisinghand-recognition-0001/model.yml
@@ -13,29 +13,32 @@
 # limitations under the License.
 
 description: >-
-  This is an action detector for the Smart Classroom scenario. It is based on
-  the RMNet backbone that includes depth-wise convolutions to reduce the amount
-  of computations for the 3x3 convolution block. The first SSD head from 1/16
-  scale feature map has four clustered prior boxes and outputs detected persons
-  (two class detector). The second SSD-based head predicts actions of the detected
-  persons. Possible actions: raising hand and other.
+  Raising-hand action detection (SSD-based) model to use in Smart Classroom environment.
 task_type: detection
 files:
   - name: FP32/person-detection-raisinghand-recognition-0001.xml
-    size: 282101
-    sha256: eb4ece57971d7cb1d3eaa154bf3e28f1f9b38a83b3876eda6f2c49ea37bf24b6
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-raisinghand-recognition-0001/FP32/person-detection-raisinghand-recognition-0001.xml
+    size: 651616
+    sha256: a94101be18b2501395c355c7751750538b62bcff8692bdc7e812382a176f7c78
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-raisinghand-recognition-0001/FP32/person-detection-raisinghand-recognition-0001.xml
   - name: FP32/person-detection-raisinghand-recognition-0001.bin
-    size: 7799752
-    sha256: 327aeec1ddc53cc03406ca28c45d4b8b9965030b353142d9cc0c13f229991a61
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-raisinghand-recognition-0001/FP32/person-detection-raisinghand-recognition-0001.bin
+    size: 7799848
+    sha256: 5183cc9d4d71e208a2cc70db9ea98bf14657d07b2bfafd050aeae9687e4359c4
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-raisinghand-recognition-0001/FP32/person-detection-raisinghand-recognition-0001.bin
   - name: FP16/person-detection-raisinghand-recognition-0001.xml
-    size: 281857
-    sha256: fe23745d025815ec52301b8ea7f4cc7dbc8aece9b621a8fd79b38bc6d34286e3
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-raisinghand-recognition-0001/FP16/person-detection-raisinghand-recognition-0001.xml
+    size: 651372
+    sha256: bae03b3a203b70ccdb39a77342d446642039522e7dae6e6a8b1efeedcf7a8582
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-raisinghand-recognition-0001/FP16/person-detection-raisinghand-recognition-0001.xml
   - name: FP16/person-detection-raisinghand-recognition-0001.bin
-    size: 3899882
-    sha256: 58ff7bba9d4f10665dd52aa011fcfe6184cccfbd48f3ecfef79b90033de1e6a5
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-raisinghand-recognition-0001/FP16/person-detection-raisinghand-recognition-0001.bin
+    size: 3899978
+    sha256: 601543473374722d45eb56b3aa8f7f250f33e1bb548d63e392332441e97c87d8
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-raisinghand-recognition-0001/FP16/person-detection-raisinghand-recognition-0001.bin
+  - name: FP32-INT8/person-detection-raisinghand-recognition-0001.xml
+    size: 1697233
+    sha256: 31d964647910358bc31f4ce2a165a6dbce21812997ecb7bb166a8fb75a0f87b1
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-raisinghand-recognition-0001/FP32-INT8/person-detection-raisinghand-recognition-0001.xml
+  - name: FP32-INT8/person-detection-raisinghand-recognition-0001.bin
+    size: 7971992
+    sha256: 7d7e37fb6404d15a9adedbf89f62b7748043c0f7cb98fea907467c9e78609e9d
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-raisinghand-recognition-0001/FP32-INT8/person-detection-raisinghand-recognition-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-detection-retail-0002/description/person-detection-retail-0002.md b/models/intel/person-detection-retail-0002/description/person-detection-retail-0002.md
index 7d92e741b95..13b28abe595 100644
--- a/models/intel/person-detection-retail-0002/description/person-detection-retail-0002.md
+++ b/models/intel/person-detection-retail-0002/description/person-detection-retail-0002.md
@@ -39,7 +39,7 @@ curve. Validation dataset consists of ~50K of images from ~100 different scenes.
 
 ## Outputs
 
-1. The net outputs "detection_ouput" blob with shape: [1x1xNx7], where N is the number of detected pedestrians.
+1. The net outputs "detection_output" blob with shape: [1x1xNx7], where N is the number of detected pedestrians.
    For each detection, the description has the format:
    [`image_id`, `label`, `conf`, `x_min`, `y_min`, `x_max`, `y_max`], where:
    - `image_id` - ID of image in batch
diff --git a/models/intel/person-detection-retail-0002/model.yml b/models/intel/person-detection-retail-0002/model.yml
index 1be72969cef..743788bc302 100644
--- a/models/intel/person-detection-retail-0002/model.yml
+++ b/models/intel/person-detection-retail-0002/model.yml
@@ -12,24 +12,33 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-description: Person detection (HyperNet+RFCN+DetectionOutput).
+description: >-
+  Person detection (HyperNet+RFCN+DetectionOutput). Used in Audience Analytics.
 task_type: detection
 files:
   - name: FP32/person-detection-retail-0002.xml
-    size: 132390
-    sha256: a5cc947c7594a749432cc5acf57a81f091ff35c58fb399e7b0fbb020246cad72
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-retail-0002/FP32/person-detection-retail-0002.xml
+    size: 267910
+    sha256: f320676380eaf3dacfceca934a52ce897889dec6fdcc10e7b99e51dd80912ded
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-retail-0002/FP32/person-detection-retail-0002.xml
   - name: FP32/person-detection-retail-0002.bin
-    size: 12976388
-    sha256: 78f600869517ee2a9ecc79505b5cfab9849c4c4494035041993c97cc7f4fb745
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-retail-0002/FP32/person-detection-retail-0002.bin
+    size: 12976100
+    sha256: 8150eb7ea3352abb272276deb3ce64d0414464e9f4bf02739ec4f2770b8acb75
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-retail-0002/FP32/person-detection-retail-0002.bin
   - name: FP16/person-detection-retail-0002.xml
-    size: 132266
-    sha256: 83726d14a07f4d73fab65a9a765c8e043aeced04cb2676a15920fc2d65d326ba
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-retail-0002/FP16/person-detection-retail-0002.xml
+    size: 267787
+    sha256: 3f3960a9cc61bb1416e5e362e2133139be76b5db07ddf18b7b776e80cfe140c4
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-retail-0002/FP16/person-detection-retail-0002.xml
   - name: FP16/person-detection-retail-0002.bin
-    size: 6488220
-    sha256: 04d28806b41709a01e803a1da0894c17d8033f93e6d38822a732f2ba2fe6ea1c
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-retail-0002/FP16/person-detection-retail-0002.bin
+    size: 6488130
+    sha256: 32008b134ea50eb70a4f97d74562a0a2c542d3c30f19a5d7ef1b57e8615d7039
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-retail-0002/FP16/person-detection-retail-0002.bin
+  - name: FP32-INT8/person-detection-retail-0002.xml
+    size: 694526
+    sha256: 0251fad4e66e14133b9544d4bd9ac3096ff06d45efff3a3a63fe494bb3d37987
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-retail-0002/FP32-INT8/person-detection-retail-0002.xml
+  - name: FP32-INT8/person-detection-retail-0002.bin
+    size: 13051624
+    sha256: d700bd305d836b6f136043d71647f5f501edb0cf9251e60c6a25f4f239289403
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-retail-0002/FP32-INT8/person-detection-retail-0002.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-detection-retail-0013/model.yml b/models/intel/person-detection-retail-0013/model.yml
index edc7ff9c60e..2859ee13152 100644
--- a/models/intel/person-detection-retail-0013/model.yml
+++ b/models/intel/person-detection-retail-0013/model.yml
@@ -13,35 +13,32 @@
 # limitations under the License.
 
 description: >-
-  This is a pedestrian detector for the Retail scenario. It is based on MobileNetV2-like
-  backbone that includes depth-wise convolutions to reduce the amount of computation
-  for the 3x3 convolution block. The single SSD head from 1/16 scale feature map
-  has 12 clustered prior boxes.
+  Pedestrian detection (RMNet with lrelu + SSD)
 task_type: detection
 files:
   - name: FP32/person-detection-retail-0013.xml
-    size: 155885
-    sha256: 05b408a1d7f2934eb2819312931bd2a81cb27fee26bec804766e17fb1be2f5af
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-retail-0013/FP32/person-detection-retail-0013.xml
+    size: 354260
+    sha256: d83a9b8a82a9e6fb52c73f63c4ab6e71d57592c8b2068a85f14548df7cef8eae
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-retail-0013/FP32/person-detection-retail-0013.xml
   - name: FP32/person-detection-retail-0013.bin
-    size: 2891268
-    sha256: c870150640a9ed9e6ab7e3d93398d4ca7604d7b97569b77ee7494649271bbc83
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-retail-0013/FP32/person-detection-retail-0013.bin
+    size: 2891364
+    sha256: 6f09cb7061328942f9d5e9fc81631a4234be66a26daa50cd672d4077ee82ad44
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-retail-0013/FP32/person-detection-retail-0013.bin
   - name: FP16/person-detection-retail-0013.xml
-    size: 155730
-    sha256: ff1fd1351a241ce52b5044c62253f9947aba9bfdcb92dda3bc94d12c9b4b35ad
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-retail-0013/FP16/person-detection-retail-0013.xml
+    size: 354107
+    sha256: 603502ad82af0ee6b0ee9948257aece2599ac2b153df1691b3fe5b0c33fe3a88
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-retail-0013/FP16/person-detection-retail-0013.xml
   - name: FP16/person-detection-retail-0013.bin
-    size: 1445640
-    sha256: 77eb13de84d9368da1d437aece02ba14b4ff0e48b194feb48a8b5076c861039a
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-retail-0013/FP16/person-detection-retail-0013.bin
-  - name: INT8/person-detection-retail-0013.xml
-    size: 1997589
-    sha256: e9b396acf7acd7c5560622cf00bd591f30c8c5ef3c6a4f6fa14e70b053061a3b
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-retail-0013/INT8/person-detection-retail-0013.xml
-  - name: INT8/person-detection-retail-0013.bin
-    size: 2891268
-    sha256: efdc2566e15bbc1e31990eb0a7a35becacc076e052212ec6f2b7341d0f33cb8e
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-detection-retail-0013/INT8/person-detection-retail-0013.bin
+    size: 1445736
+    sha256: 56eeccbeb3f27144046edacb95b459d60f3930f54051ef5b9e5253923c07b672
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-retail-0013/FP16/person-detection-retail-0013.bin
+  - name: FP32-INT8/person-detection-retail-0013.xml
+    size: 931279
+    sha256: 8f7e71c2db19f1f641346ff9cd99553e650b42c00a96c9bbfaf2bcbbd6daa49d
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-retail-0013/FP32-INT8/person-detection-retail-0013.xml
+  - name: FP32-INT8/person-detection-retail-0013.bin
+    size: 2969676
+    sha256: 523b79294453845934e068f4a906b9bf88b4c70ab705f2137e089439f4555b92
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-detection-retail-0013/FP32-INT8/person-detection-retail-0013.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-reidentification-retail-0031/description/person-reidentification-retail-0031.md b/models/intel/person-reidentification-retail-0031/description/person-reidentification-retail-0031.md
index 36a7a424a9c..855c6fd46f1 100644
--- a/models/intel/person-reidentification-retail-0031/description/person-reidentification-retail-0031.md
+++ b/models/intel/person-reidentification-retail-0031/description/person-reidentification-retail-0031.md
@@ -2,7 +2,7 @@
 
 ## Use Case and High-Level Description
 
-This is a person reidentification model for a general scenario. It uses a whole body image as an input and outputs an embedding vector to match a pair of images by the Cosine distance. The model is based on RMNet backbone that was developed for fast inference. A single reidentification head from the 1/16 scale feature map outputs the embedding vector of 256 floats.
+This is a person reidentification model for a general scenario. It uses a whole body image as an input and outputs an embedding vector to match a pair of images by the cosine distance. The model is based on the RMNet backbone developed for fast inference. A single reidentification head from the 1/16 scale feature map outputs an embedding vector of 256 floats.
 
 ## Example
 
@@ -22,13 +22,13 @@ This is a person reidentification model for a general scenario. It uses a whole
 | Source framework                  | Caffe*                                    |
 
 The cumulative matching curve (CMC) at rank-1 is accuracy denoting the possibility to locate at least one true positive in the top-1 rank.
-Mean Average Precision (mAP) is the mean across all queries’ Average Precision (AP) and AP is defined as an area under the [precision/recall](https://en.wikipedia.org/wiki/Precision_and_recall) curve.
+Mean Average Precision (mAP) is the mean across Average Precision (AP) of all queries. AP is defined as the area under the [precision and recall](https://en.wikipedia.org/wiki/Precision_and_recall) curve.
 
 ## Performance
 
 ## Inputs
 
-1. name: "data" , shape: [1x3x96x48] - An input image in the format [BxCxHxW],
+1. Name: `data`, shape: [1x3x96x48]. An input image in the format [BxCxHxW],
    where:
     - B - batch size
     - C - number of channels
@@ -39,7 +39,7 @@ Mean Average Precision (mAP) is the mean across all queries’ Average Precision
 
 ## Outputs
 
-1. The net outputs a blob with shape: [1, 256, 1, 1] named descriptor, which can be compared with other descriptors using the [Cosine distance](https://en.wikipedia.org/wiki/Cosine_similarity).
+1. The net outputs a blob with the [1, 256, 1, 1] shape named `descriptor`, which can be compared with other descriptors using the [cosine distance](https://en.wikipedia.org/wiki/Cosine_similarity).
 
 ## Legal Information
 [*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/person-reidentification-retail-0031/model.yml b/models/intel/person-reidentification-retail-0031/model.yml
index 7a67b8c12d5..e9850e9b291 100644
--- a/models/intel/person-reidentification-retail-0031/model.yml
+++ b/models/intel/person-reidentification-retail-0031/model.yml
@@ -13,36 +13,32 @@
 # limitations under the License.
 
 description: >-
-  This is a person reidentification model for a general scenario. It uses a whole
-  body image as an input and outputs an embedding vector to match a pair of images
-  by the Cosine distance. The model is based on RMNet backbone that was developed
-  for fast inference. A single reidentification head from the 1/16 scale feature
-  map outputs the embedding vector of 256 floats.
+  Single embedding-based person reidentification model (fastest person ReID model)
 task_type: object_attributes
 files:
   - name: FP32/person-reidentification-retail-0031.xml
-    size: 66640
-    sha256: b2b23a9f79ed992081efd0dd9448074196f338af4b9dcaf9bac4c0b078a1446d
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0031/FP32/person-reidentification-retail-0031.xml
+    size: 136151
+    sha256: d4b9d09fd6acedb368a3c3dc1e61a1e1500ba51308fe7b03e369bc32810eadc1
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0031/FP32/person-reidentification-retail-0031.xml
   - name: FP32/person-reidentification-retail-0031.bin
-    size: 1120184
-    sha256: 8b9d349d330909815d2e75b57654c4cd6c27eb37c87d3280dfeaae03d166a4f4
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0031/FP32/person-reidentification-retail-0031.bin
+    size: 1120216
+    sha256: 8343531e60f2e36da8311bb768de42b9b03b51d848510da74cb5bf7cbb790823
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0031/FP32/person-reidentification-retail-0031.bin
   - name: FP16/person-reidentification-retail-0031.xml
-    size: 66578
-    sha256: 3f6c0946aab9911978e45b036278b275f02b2dd7444a0d20614193900ffbbd09
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0031/FP16/person-reidentification-retail-0031.xml
+    size: 136089
+    sha256: 540e578f5aa87e85b5a25201cc7a6d389762e7f69b062acd88901275d398f592
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0031/FP16/person-reidentification-retail-0031.xml
   - name: FP16/person-reidentification-retail-0031.bin
-    size: 560092
-    sha256: 833c136bcce82bcba6de6289fc21ee24f24d4597e52c41717c2602ee275b2f7d
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0031/FP16/person-reidentification-retail-0031.bin
-  - name: INT8/person-reidentification-retail-0031.xml
-    size: 264617
-    sha256: 9441b1128224dc60ee5e14cdb62ec1eb045d6fc7ef363fab014bd6f729f3be50
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0031/INT8/person-reidentification-retail-0031.xml
-  - name: INT8/person-reidentification-retail-0031.bin
-    size: 1120184
-    sha256: 5533422c49746f6856dca186822a9a15c47b88dffced26401b374ba99e731f57
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0031/INT8/person-reidentification-retail-0031.bin
+    size: 560124
+    sha256: 67e230352812b64ede186c62aaf7369a63fd6f5d8d9a8c98fb7138dac1dfd8bb
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0031/FP16/person-reidentification-retail-0031.bin
+  - name: FP32-INT8/person-reidentification-retail-0031.xml
+    size: 385535
+    sha256: 9e77f629b83f0f3c09118b5c231d2f99ca806b0a6cc5942640198fd15f20b49e
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0031/FP32-INT8/person-reidentification-retail-0031.xml
+  - name: FP32-INT8/person-reidentification-retail-0031.bin
+    size: 1153352
+    sha256: 09c24cd2a8d7f0460d3f9b12dbb04c62198a9d1fe27df52ff75ceea72e046dbd
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0031/FP32-INT8/person-reidentification-retail-0031.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-reidentification-retail-0076/description/person-reidentification-retail-0076.md b/models/intel/person-reidentification-retail-0076/description/person-reidentification-retail-0076.md
deleted file mode 100644
index a076747a044..00000000000
--- a/models/intel/person-reidentification-retail-0076/description/person-reidentification-retail-0076.md
+++ /dev/null
@@ -1,45 +0,0 @@
-# person-reidentification-retail-0076
-
-## Use Case and High-Level Description
-
-This is a person reidentification model for a general scenario. It uses a whole body image as an input and outputs an embedding vector to match a pair of images by the Cosine distance. The model is based on RMNet backbone that was developed for fast inference. A single reidentification head from the 1/16 scale feature map outputs the embedding vector of 256 floats. The model is provided without last calibration layer, but can be used in the same way as the original model (with insignificant drop in accuracy).
-
-## Example
-
-![](./person-reidentification-retail-0076.png)
-
-## Specification
-
-| Metric                            | Value                                     |
-|-----------------------------------|-------------------------------------------|
-| Market-1501 rank@1 accuracy       | 0.9237                                    |
-| Market-1501 mAP                   | 0.8253                                    |
-| Pose coverage                     | Standing upright, parallel to image plane |
-| Support of occluded pedestrians   | YES                                       |
-| Occlusion coverage                | <50%                                      |
-| GFlops                            | 0.594                                     |
-| MParams                           | 0.820                                     |
-| Source framework                  | Caffe*                                    |
-
-The cumulative matching curve (CMC) at rank-1 is accuracy denoting the possibility to locate at least one true positive in the top-1 rank.
-Mean Average Precision (mAP) is the mean across all queries’ Average Precision (AP) and AP is defined as an area under the [precision/recall](https://en.wikipedia.org/wiki/Precision_and_recall) curve.
-
-## Performance
-
-## Inputs
-
-1. name: "data" , shape: [1x3x384x128] - An input image in the format [BxCxHxW],
-   where:
-    - B - batch size
-    - C - number of channels
-    - H - image height
-    - W - image width
-
-   The expected color order is BGR.
-
-## Outputs
-
-1. The net outputs a blob with shape: [1, 256, 1, 1] named descriptor, which can be compared with other descriptors using the [Cosine distance](https://en.wikipedia.org/wiki/Cosine_similarity).
-
-## Legal Information
-[*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/person-reidentification-retail-0076/description/person-reidentification-retail-0076.png b/models/intel/person-reidentification-retail-0076/description/person-reidentification-retail-0076.png
deleted file mode 100644
index 3bff7952dbe..00000000000
Binary files a/models/intel/person-reidentification-retail-0076/description/person-reidentification-retail-0076.png and /dev/null differ
diff --git a/models/intel/person-reidentification-retail-0076/model.yml b/models/intel/person-reidentification-retail-0076/model.yml
deleted file mode 100644
index 4ba53e1e8ae..00000000000
--- a/models/intel/person-reidentification-retail-0076/model.yml
+++ /dev/null
@@ -1,50 +0,0 @@
-# Copyright (c) 2019 Intel Corporation
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-description: >-
-  This is a person reidentification model for a general scenario. It uses a whole
-  body image as an input and outputs an embedding vector to match a pair of images
-  by the Cosine distance. The model is based on RMNet backbone that was developed
-  for fast inference. A single reidentification head from the 1/16 scale feature
-  map outputs the embedding vector of 256 floats. The model is provided without
-  last calibration layer, but can be used in the same way as the original model
-  (with insignificant drop in accuracy).
-task_type: object_attributes
-files:
-  - name: FP32/person-reidentification-retail-0076.xml
-    size: 150110
-    sha256: e918d7945e65fbc1b49c0dabe05af6bf1acde9a54d630e5eb674e08347831c91
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0076/FP32/person-reidentification-retail-0076.xml
-  - name: FP32/person-reidentification-retail-0076.bin
-    size: 3279064
-    sha256: acd718a8e6bd0c9e52605ecfe3f5a7ba87280976315bccc94e9302bbe520d898
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0076/FP32/person-reidentification-retail-0076.bin
-  - name: FP16/person-reidentification-retail-0076.xml
-    size: 149955
-    sha256: b11d33421c66bb88f6705dd504690ce5aae3118e51c782c6a8276b459175fb53
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0076/FP16/person-reidentification-retail-0076.xml
-  - name: FP16/person-reidentification-retail-0076.bin
-    size: 1639532
-    sha256: c8a127cb2b8ff5f26b1d248de5a07b79c916103ee39bec0825fb990e4b043fd6
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0076/FP16/person-reidentification-retail-0076.bin
-  - name: INT8/person-reidentification-retail-0076.xml
-    size: 667125
-    sha256: 595745f9f3b5aabd62d38c569e47b3ddb5ff31c7b6ba4d5c04d7bc7c9a0384b5
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0076/INT8/person-reidentification-retail-0076.xml
-  - name: INT8/person-reidentification-retail-0076.bin
-    size: 3279064
-    sha256: a9ccbfa75998427553910159459d9d001b0264e02a6ee6c07e24a2a4f2f329cd
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0076/INT8/person-reidentification-retail-0076.bin
-framework: dldt
-license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-reidentification-retail-0076/person-reidentification-retail-0076.prototxt b/models/intel/person-reidentification-retail-0076/person-reidentification-retail-0076.prototxt
deleted file mode 100644
index 4f8592fbc49..00000000000
--- a/models/intel/person-reidentification-retail-0076/person-reidentification-retail-0076.prototxt
+++ /dev/null
@@ -1,8579 +0,0 @@
-name: "ICV-RMNet-PD-ReID-Heavy"
-layer {
-type: "Input"
-name: "data"
-top: "data"
-  input_param {
-    shape {
-      dim: 1
-      dim: 3
-      dim: 384
-      dim: 128
-    }
-  }
-}
-
-###################################################
-############### Data normalization ################
-###################################################
-
-layer {
-  name: "data/norm/bn"
-  type: "BatchNorm"
-  bottom: "data"
-  top: "data"
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-}
-layer {
-  name: "data/norm/scale"
-  type: "Scale"
-  bottom: "data"
-  top: "data"
-  param {
-    lr_mult: 1.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 2.0
-    decay_mult: 0.0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1.0
-    }
-    bias_term: true
-    bias_filler {
-      value: 0.0
-    }
-  }
-}
-
-###################################################
-################### Backbone ######################
-###################################################
-
-layer {
-  name: "init_block1/dim_inc/conv"
-  type: "Convolution"
-  bottom: "data"
-  top: "init_block1/dim_inc/conv"
-  param {
-    name: "init_block1/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    stride: 2
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "init_block1/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "init_block1/dim_inc/conv"
-  top: "init_block1/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "init_block1/dim_inc/scale"
-  type: "Scale"
-  bottom: "init_block1/dim_inc/conv"
-  top: "init_block1/dim_inc/conv"
-  param {
-    name: "init_block1/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "init_block1/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "init_block1/dim_inc/fn"
-  type: "ReLU"
-  bottom: "init_block1/dim_inc/conv"
-  top: "init_block1/dim_inc/conv"
-}
-layer {
-  name: "bottleneck1_1/dim_red/conv"
-  type: "Convolution"
-  bottom: "init_block1/dim_inc/conv"
-  top: "bottleneck1_1/dim_red/conv"
-  param {
-    name: "bottleneck1_1/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_1/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_1/dim_red/conv"
-  top: "bottleneck1_1/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_1/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck1_1/dim_red/conv"
-  top: "bottleneck1_1/dim_red/conv"
-  param {
-    name: "bottleneck1_1/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_1/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_1/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck1_1/dim_red/conv"
-  top: "bottleneck1_1/dim_red/conv"
-}
-layer {
-  name: "bottleneck1_1/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_1/dim_red/conv"
-  top: "bottleneck1_1/inner/dw1/conv"
-  param {
-    name: "bottleneck1_1/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 8
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_1/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_1/inner/dw1/conv"
-  top: "bottleneck1_1/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_1/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck1_1/inner/dw1/conv"
-  top: "bottleneck1_1/inner/dw1/conv"
-  param {
-    name: "bottleneck1_1/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_1/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_1/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck1_1/inner/dw1/conv"
-  top: "bottleneck1_1/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck1_1/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_1/inner/dw1/conv"
-  top: "bottleneck1_1/dim_inc/conv"
-  param {
-    name: "bottleneck1_1/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_1/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_1/dim_inc/conv"
-  top: "bottleneck1_1/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_1/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck1_1/dim_inc/conv"
-  top: "bottleneck1_1/dim_inc/conv"
-  param {
-    name: "bottleneck1_1/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_1/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_1/add"
-  type: "Eltwise"
-  bottom: "init_block1/dim_inc/conv"
-  bottom: "bottleneck1_1/dim_inc/conv"
-  top: "bottleneck1_1/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck1_1/fn"
-  type: "ELU"
-  bottom: "bottleneck1_1/add"
-  top: "bottleneck1_1/add"
-}
-layer {
-  name: "bottleneck1_2/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_1/add"
-  top: "bottleneck1_2/dim_red/conv"
-  param {
-    name: "bottleneck1_2/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_2/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_2/dim_red/conv"
-  top: "bottleneck1_2/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_2/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck1_2/dim_red/conv"
-  top: "bottleneck1_2/dim_red/conv"
-  param {
-    name: "bottleneck1_2/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_2/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_2/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck1_2/dim_red/conv"
-  top: "bottleneck1_2/dim_red/conv"
-}
-layer {
-  name: "bottleneck1_2/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_2/dim_red/conv"
-  top: "bottleneck1_2/inner/dw1/conv"
-  param {
-    name: "bottleneck1_2/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 8
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_2/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_2/inner/dw1/conv"
-  top: "bottleneck1_2/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_2/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck1_2/inner/dw1/conv"
-  top: "bottleneck1_2/inner/dw1/conv"
-  param {
-    name: "bottleneck1_2/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_2/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_2/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck1_2/inner/dw1/conv"
-  top: "bottleneck1_2/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck1_2/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_2/inner/dw1/conv"
-  top: "bottleneck1_2/dim_inc/conv"
-  param {
-    name: "bottleneck1_2/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_2/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_2/dim_inc/conv"
-  top: "bottleneck1_2/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_2/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck1_2/dim_inc/conv"
-  top: "bottleneck1_2/dim_inc/conv"
-  param {
-    name: "bottleneck1_2/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_2/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_2/add"
-  type: "Eltwise"
-  bottom: "bottleneck1_1/add"
-  bottom: "bottleneck1_2/dim_inc/conv"
-  top: "bottleneck1_2/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck1_2/fn"
-  type: "ELU"
-  bottom: "bottleneck1_2/add"
-  top: "bottleneck1_2/add"
-}
-layer {
-  name: "bottleneck1_3/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_2/add"
-  top: "bottleneck1_3/dim_red/conv"
-  param {
-    name: "bottleneck1_3/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_3/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_3/dim_red/conv"
-  top: "bottleneck1_3/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_3/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck1_3/dim_red/conv"
-  top: "bottleneck1_3/dim_red/conv"
-  param {
-    name: "bottleneck1_3/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_3/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_3/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck1_3/dim_red/conv"
-  top: "bottleneck1_3/dim_red/conv"
-}
-layer {
-  name: "bottleneck1_3/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_3/dim_red/conv"
-  top: "bottleneck1_3/inner/dw1/conv"
-  param {
-    name: "bottleneck1_3/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 8
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_3/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_3/inner/dw1/conv"
-  top: "bottleneck1_3/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_3/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck1_3/inner/dw1/conv"
-  top: "bottleneck1_3/inner/dw1/conv"
-  param {
-    name: "bottleneck1_3/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_3/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_3/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck1_3/inner/dw1/conv"
-  top: "bottleneck1_3/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck1_3/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_3/inner/dw1/conv"
-  top: "bottleneck1_3/dim_inc/conv"
-  param {
-    name: "bottleneck1_3/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_3/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_3/dim_inc/conv"
-  top: "bottleneck1_3/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_3/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck1_3/dim_inc/conv"
-  top: "bottleneck1_3/dim_inc/conv"
-  param {
-    name: "bottleneck1_3/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_3/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_3/add"
-  type: "Eltwise"
-  bottom: "bottleneck1_2/add"
-  bottom: "bottleneck1_3/dim_inc/conv"
-  top: "bottleneck1_3/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck1_3/fn"
-  type: "ELU"
-  bottom: "bottleneck1_3/add"
-  top: "bottleneck1_3/add"
-}
-layer {
-  name: "bottleneck1_4/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_3/add"
-  top: "bottleneck1_4/dim_red/conv"
-  param {
-    name: "bottleneck1_4/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_4/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_4/dim_red/conv"
-  top: "bottleneck1_4/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_4/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck1_4/dim_red/conv"
-  top: "bottleneck1_4/dim_red/conv"
-  param {
-    name: "bottleneck1_4/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_4/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_4/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck1_4/dim_red/conv"
-  top: "bottleneck1_4/dim_red/conv"
-}
-layer {
-  name: "bottleneck1_4/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_4/dim_red/conv"
-  top: "bottleneck1_4/inner/dw1/conv"
-  param {
-    name: "bottleneck1_4/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 8
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_4/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_4/inner/dw1/conv"
-  top: "bottleneck1_4/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_4/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck1_4/inner/dw1/conv"
-  top: "bottleneck1_4/inner/dw1/conv"
-  param {
-    name: "bottleneck1_4/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_4/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_4/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck1_4/inner/dw1/conv"
-  top: "bottleneck1_4/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck1_4/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_4/inner/dw1/conv"
-  top: "bottleneck1_4/dim_inc/conv"
-  param {
-    name: "bottleneck1_4/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_4/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_4/dim_inc/conv"
-  top: "bottleneck1_4/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_4/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck1_4/dim_inc/conv"
-  top: "bottleneck1_4/dim_inc/conv"
-  param {
-    name: "bottleneck1_4/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_4/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_4/add"
-  type: "Eltwise"
-  bottom: "bottleneck1_3/add"
-  bottom: "bottleneck1_4/dim_inc/conv"
-  top: "bottleneck1_4/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck1_4/fn"
-  type: "ELU"
-  bottom: "bottleneck1_4/add"
-  top: "bottleneck1_4/add"
-}
-layer {
-  name: "bottleneck2_0/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_4/add"
-  top: "bottleneck2_0/dim_red/conv"
-  param {
-    name: "bottleneck2_0/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_0/dim_red/conv"
-  top: "bottleneck2_0/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_0/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_0/dim_red/conv"
-  top: "bottleneck2_0/dim_red/conv"
-  param {
-    name: "bottleneck2_0/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_0/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_0/dim_red/conv"
-  top: "bottleneck2_0/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_0/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_0/dim_red/conv"
-  top: "bottleneck2_0/inner/dw1/conv"
-  param {
-    name: "bottleneck2_0/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 2
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_0/inner/dw1/conv"
-  top: "bottleneck2_0/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_0/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_0/inner/dw1/conv"
-  top: "bottleneck2_0/inner/dw1/conv"
-  param {
-    name: "bottleneck2_0/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_0/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_0/inner/dw1/conv"
-  top: "bottleneck2_0/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_0/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_0/inner/dw1/conv"
-  top: "bottleneck2_0/dim_inc/conv"
-  param {
-    name: "bottleneck2_0/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_0/dim_inc/conv"
-  top: "bottleneck2_0/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_0/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_0/dim_inc/conv"
-  top: "bottleneck2_0/dim_inc/conv"
-  param {
-    name: "bottleneck2_0/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_0/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/skip/pooling"
-  type: "Pooling"
-  bottom: "bottleneck1_4/add"
-  top: "bottleneck2_0/skip/pooling"
-  pooling_param {
-    pool: MAX
-    kernel_size: 2
-    stride: 2
-    pad: 0
-  }
-}
-layer {
-  name: "bottleneck2_0/skip/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_0/skip/pooling"
-  top: "bottleneck2_0/skip/conv"
-  param {
-    name: "bottleneck2_0/skip/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/skip/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_0/skip/conv"
-  top: "bottleneck2_0/skip/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_0/skip/scale"
-  type: "Scale"
-  bottom: "bottleneck2_0/skip/conv"
-  top: "bottleneck2_0/skip/conv"
-  param {
-    name: "bottleneck2_0/skip/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_0/skip/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_0/skip/conv"
-  bottom: "bottleneck2_0/dim_inc/conv"
-  top: "bottleneck2_0/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_0/fn"
-  type: "ELU"
-  bottom: "bottleneck2_0/add"
-  top: "bottleneck2_0/add"
-}
-layer {
-  name: "bottleneck2_1/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_0/add"
-  top: "bottleneck2_1/dim_red/conv"
-  param {
-    name: "bottleneck2_1/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_1/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_1/dim_red/conv"
-  top: "bottleneck2_1/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_1/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_1/dim_red/conv"
-  top: "bottleneck2_1/dim_red/conv"
-  param {
-    name: "bottleneck2_1/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_1/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_1/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_1/dim_red/conv"
-  top: "bottleneck2_1/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_1/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_1/dim_red/conv"
-  top: "bottleneck2_1/inner/dw1/conv"
-  param {
-    name: "bottleneck2_1/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_1/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_1/inner/dw1/conv"
-  top: "bottleneck2_1/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_1/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_1/inner/dw1/conv"
-  top: "bottleneck2_1/inner/dw1/conv"
-  param {
-    name: "bottleneck2_1/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_1/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_1/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_1/inner/dw1/conv"
-  top: "bottleneck2_1/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_1/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_1/inner/dw1/conv"
-  top: "bottleneck2_1/dim_inc/conv"
-  param {
-    name: "bottleneck2_1/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_1/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_1/dim_inc/conv"
-  top: "bottleneck2_1/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_1/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_1/dim_inc/conv"
-  top: "bottleneck2_1/dim_inc/conv"
-  param {
-    name: "bottleneck2_1/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_1/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_1/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_0/add"
-  bottom: "bottleneck2_1/dim_inc/conv"
-  top: "bottleneck2_1/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_1/add"
-  top: "bottleneck2_1/add"
-}
-layer {
-  name: "bottleneck2_2/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_1/add"
-  top: "bottleneck2_2/dim_red/conv"
-  param {
-    name: "bottleneck2_2/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_2/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_2/dim_red/conv"
-  top: "bottleneck2_2/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_2/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_2/dim_red/conv"
-  top: "bottleneck2_2/dim_red/conv"
-  param {
-    name: "bottleneck2_2/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_2/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_2/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_2/dim_red/conv"
-  top: "bottleneck2_2/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_2/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_2/dim_red/conv"
-  top: "bottleneck2_2/inner/dw1/conv"
-  param {
-    name: "bottleneck2_2/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_2/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_2/inner/dw1/conv"
-  top: "bottleneck2_2/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_2/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_2/inner/dw1/conv"
-  top: "bottleneck2_2/inner/dw1/conv"
-  param {
-    name: "bottleneck2_2/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_2/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_2/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_2/inner/dw1/conv"
-  top: "bottleneck2_2/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_2/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_2/inner/dw1/conv"
-  top: "bottleneck2_2/dim_inc/conv"
-  param {
-    name: "bottleneck2_2/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_2/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_2/dim_inc/conv"
-  top: "bottleneck2_2/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_2/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_2/dim_inc/conv"
-  top: "bottleneck2_2/dim_inc/conv"
-  param {
-    name: "bottleneck2_2/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_2/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_2/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_1/add"
-  bottom: "bottleneck2_2/dim_inc/conv"
-  top: "bottleneck2_2/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_2/fn"
-  type: "ELU"
-  bottom: "bottleneck2_2/add"
-  top: "bottleneck2_2/add"
-}
-layer {
-  name: "bottleneck2_3/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_2/add"
-  top: "bottleneck2_3/dim_red/conv"
-  param {
-    name: "bottleneck2_3/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_3/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_3/dim_red/conv"
-  top: "bottleneck2_3/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_3/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_3/dim_red/conv"
-  top: "bottleneck2_3/dim_red/conv"
-  param {
-    name: "bottleneck2_3/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_3/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_3/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_3/dim_red/conv"
-  top: "bottleneck2_3/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_3/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_3/dim_red/conv"
-  top: "bottleneck2_3/inner/dw1/conv"
-  param {
-    name: "bottleneck2_3/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_3/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_3/inner/dw1/conv"
-  top: "bottleneck2_3/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_3/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_3/inner/dw1/conv"
-  top: "bottleneck2_3/inner/dw1/conv"
-  param {
-    name: "bottleneck2_3/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_3/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_3/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_3/inner/dw1/conv"
-  top: "bottleneck2_3/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_3/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_3/inner/dw1/conv"
-  top: "bottleneck2_3/dim_inc/conv"
-  param {
-    name: "bottleneck2_3/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_3/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_3/dim_inc/conv"
-  top: "bottleneck2_3/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_3/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_3/dim_inc/conv"
-  top: "bottleneck2_3/dim_inc/conv"
-  param {
-    name: "bottleneck2_3/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_3/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_3/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_2/add"
-  bottom: "bottleneck2_3/dim_inc/conv"
-  top: "bottleneck2_3/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_3/fn"
-  type: "ELU"
-  bottom: "bottleneck2_3/add"
-  top: "bottleneck2_3/add"
-}
-layer {
-  name: "bottleneck2_4/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_3/add"
-  top: "bottleneck2_4/dim_red/conv"
-  param {
-    name: "bottleneck2_4/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_4/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_4/dim_red/conv"
-  top: "bottleneck2_4/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_4/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_4/dim_red/conv"
-  top: "bottleneck2_4/dim_red/conv"
-  param {
-    name: "bottleneck2_4/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_4/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_4/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_4/dim_red/conv"
-  top: "bottleneck2_4/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_4/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_4/dim_red/conv"
-  top: "bottleneck2_4/inner/dw1/conv"
-  param {
-    name: "bottleneck2_4/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_4/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_4/inner/dw1/conv"
-  top: "bottleneck2_4/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_4/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_4/inner/dw1/conv"
-  top: "bottleneck2_4/inner/dw1/conv"
-  param {
-    name: "bottleneck2_4/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_4/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_4/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_4/inner/dw1/conv"
-  top: "bottleneck2_4/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_4/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_4/inner/dw1/conv"
-  top: "bottleneck2_4/dim_inc/conv"
-  param {
-    name: "bottleneck2_4/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_4/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_4/dim_inc/conv"
-  top: "bottleneck2_4/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_4/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_4/dim_inc/conv"
-  top: "bottleneck2_4/dim_inc/conv"
-  param {
-    name: "bottleneck2_4/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_4/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_4/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_3/add"
-  bottom: "bottleneck2_4/dim_inc/conv"
-  top: "bottleneck2_4/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_4/fn"
-  type: "ELU"
-  bottom: "bottleneck2_4/add"
-  top: "bottleneck2_4/add"
-}
-layer {
-  name: "bottleneck2_5/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_4/add"
-  top: "bottleneck2_5/dim_red/conv"
-  param {
-    name: "bottleneck2_5/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_5/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_5/dim_red/conv"
-  top: "bottleneck2_5/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_5/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_5/dim_red/conv"
-  top: "bottleneck2_5/dim_red/conv"
-  param {
-    name: "bottleneck2_5/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_5/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_5/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_5/dim_red/conv"
-  top: "bottleneck2_5/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_5/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_5/dim_red/conv"
-  top: "bottleneck2_5/inner/dw1/conv"
-  param {
-    name: "bottleneck2_5/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_5/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_5/inner/dw1/conv"
-  top: "bottleneck2_5/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_5/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_5/inner/dw1/conv"
-  top: "bottleneck2_5/inner/dw1/conv"
-  param {
-    name: "bottleneck2_5/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_5/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_5/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_5/inner/dw1/conv"
-  top: "bottleneck2_5/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_5/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_5/inner/dw1/conv"
-  top: "bottleneck2_5/dim_inc/conv"
-  param {
-    name: "bottleneck2_5/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_5/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_5/dim_inc/conv"
-  top: "bottleneck2_5/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_5/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_5/dim_inc/conv"
-  top: "bottleneck2_5/dim_inc/conv"
-  param {
-    name: "bottleneck2_5/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_5/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_5/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_4/add"
-  bottom: "bottleneck2_5/dim_inc/conv"
-  top: "bottleneck2_5/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_5/fn"
-  type: "ELU"
-  bottom: "bottleneck2_5/add"
-  top: "bottleneck2_5/add"
-}
-layer {
-  name: "bottleneck2_6/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_5/add"
-  top: "bottleneck2_6/dim_red/conv"
-  param {
-    name: "bottleneck2_6/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_6/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_6/dim_red/conv"
-  top: "bottleneck2_6/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_6/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_6/dim_red/conv"
-  top: "bottleneck2_6/dim_red/conv"
-  param {
-    name: "bottleneck2_6/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_6/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_6/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_6/dim_red/conv"
-  top: "bottleneck2_6/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_6/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_6/dim_red/conv"
-  top: "bottleneck2_6/inner/dw1/conv"
-  param {
-    name: "bottleneck2_6/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_6/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_6/inner/dw1/conv"
-  top: "bottleneck2_6/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_6/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_6/inner/dw1/conv"
-  top: "bottleneck2_6/inner/dw1/conv"
-  param {
-    name: "bottleneck2_6/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_6/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_6/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_6/inner/dw1/conv"
-  top: "bottleneck2_6/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_6/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_6/inner/dw1/conv"
-  top: "bottleneck2_6/dim_inc/conv"
-  param {
-    name: "bottleneck2_6/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_6/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_6/dim_inc/conv"
-  top: "bottleneck2_6/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_6/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_6/dim_inc/conv"
-  top: "bottleneck2_6/dim_inc/conv"
-  param {
-    name: "bottleneck2_6/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_6/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_6/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_5/add"
-  bottom: "bottleneck2_6/dim_inc/conv"
-  top: "bottleneck2_6/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_6/fn"
-  type: "ELU"
-  bottom: "bottleneck2_6/add"
-  top: "bottleneck2_6/add"
-}
-layer {
-  name: "bottleneck2_7/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_6/add"
-  top: "bottleneck2_7/dim_red/conv"
-  param {
-    name: "bottleneck2_7/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_7/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_7/dim_red/conv"
-  top: "bottleneck2_7/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_7/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_7/dim_red/conv"
-  top: "bottleneck2_7/dim_red/conv"
-  param {
-    name: "bottleneck2_7/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_7/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_7/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_7/dim_red/conv"
-  top: "bottleneck2_7/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_7/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_7/dim_red/conv"
-  top: "bottleneck2_7/inner/dw1/conv"
-  param {
-    name: "bottleneck2_7/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_7/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_7/inner/dw1/conv"
-  top: "bottleneck2_7/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_7/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_7/inner/dw1/conv"
-  top: "bottleneck2_7/inner/dw1/conv"
-  param {
-    name: "bottleneck2_7/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_7/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_7/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_7/inner/dw1/conv"
-  top: "bottleneck2_7/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_7/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_7/inner/dw1/conv"
-  top: "bottleneck2_7/dim_inc/conv"
-  param {
-    name: "bottleneck2_7/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_7/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_7/dim_inc/conv"
-  top: "bottleneck2_7/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_7/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_7/dim_inc/conv"
-  top: "bottleneck2_7/dim_inc/conv"
-  param {
-    name: "bottleneck2_7/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_7/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_7/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_6/add"
-  bottom: "bottleneck2_7/dim_inc/conv"
-  top: "bottleneck2_7/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_7/fn"
-  type: "ELU"
-  bottom: "bottleneck2_7/add"
-  top: "bottleneck2_7/add"
-}
-layer {
-  name: "bottleneck2_8/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_7/add"
-  top: "bottleneck2_8/dim_red/conv"
-  param {
-    name: "bottleneck2_8/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_8/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_8/dim_red/conv"
-  top: "bottleneck2_8/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_8/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_8/dim_red/conv"
-  top: "bottleneck2_8/dim_red/conv"
-  param {
-    name: "bottleneck2_8/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_8/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_8/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_8/dim_red/conv"
-  top: "bottleneck2_8/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_8/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_8/dim_red/conv"
-  top: "bottleneck2_8/inner/dw1/conv"
-  param {
-    name: "bottleneck2_8/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_8/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_8/inner/dw1/conv"
-  top: "bottleneck2_8/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_8/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_8/inner/dw1/conv"
-  top: "bottleneck2_8/inner/dw1/conv"
-  param {
-    name: "bottleneck2_8/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_8/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_8/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_8/inner/dw1/conv"
-  top: "bottleneck2_8/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_8/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_8/inner/dw1/conv"
-  top: "bottleneck2_8/dim_inc/conv"
-  param {
-    name: "bottleneck2_8/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_8/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_8/dim_inc/conv"
-  top: "bottleneck2_8/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_8/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_8/dim_inc/conv"
-  top: "bottleneck2_8/dim_inc/conv"
-  param {
-    name: "bottleneck2_8/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_8/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_8/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_7/add"
-  bottom: "bottleneck2_8/dim_inc/conv"
-  top: "bottleneck2_8/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_8/fn"
-  type: "ELU"
-  bottom: "bottleneck2_8/add"
-  top: "bottleneck2_8/add"
-}
-layer {
-  name: "bottleneck3_0/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_8/add"
-  top: "bottleneck3_0/dim_red/conv"
-  param {
-    name: "bottleneck3_0/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_0/dim_red/conv"
-  top: "bottleneck3_0/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_0/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_0/dim_red/conv"
-  top: "bottleneck3_0/dim_red/conv"
-  param {
-    name: "bottleneck3_0/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_0/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_0/dim_red/conv"
-  top: "bottleneck3_0/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_0/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_0/dim_red/conv"
-  top: "bottleneck3_0/inner/dw1/conv"
-  param {
-    name: "bottleneck3_0/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 2
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_0/inner/dw1/conv"
-  top: "bottleneck3_0/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_0/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_0/inner/dw1/conv"
-  top: "bottleneck3_0/inner/dw1/conv"
-  param {
-    name: "bottleneck3_0/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_0/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_0/inner/dw1/conv"
-  top: "bottleneck3_0/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_0/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_0/inner/dw1/conv"
-  top: "bottleneck3_0/dim_inc/conv"
-  param {
-    name: "bottleneck3_0/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_0/dim_inc/conv"
-  top: "bottleneck3_0/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_0/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_0/dim_inc/conv"
-  top: "bottleneck3_0/dim_inc/conv"
-  param {
-    name: "bottleneck3_0/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_0/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/skip/pooling"
-  type: "Pooling"
-  bottom: "bottleneck2_8/add"
-  top: "bottleneck3_0/skip/pooling"
-  pooling_param {
-    pool: MAX
-    kernel_size: 2
-    stride: 2
-    pad: 0
-  }
-}
-layer {
-  name: "bottleneck3_0/skip/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_0/skip/pooling"
-  top: "bottleneck3_0/skip/conv"
-  param {
-    name: "bottleneck3_0/skip/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/skip/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_0/skip/conv"
-  top: "bottleneck3_0/skip/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_0/skip/scale"
-  type: "Scale"
-  bottom: "bottleneck3_0/skip/conv"
-  top: "bottleneck3_0/skip/conv"
-  param {
-    name: "bottleneck3_0/skip/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_0/skip/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_0/skip/conv"
-  bottom: "bottleneck3_0/dim_inc/conv"
-  top: "bottleneck3_0/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_0/fn"
-  type: "ELU"
-  bottom: "bottleneck3_0/add"
-  top: "bottleneck3_0/add"
-}
-layer {
-  name: "bottleneck3_1/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_0/add"
-  top: "bottleneck3_1/dim_red/conv"
-  param {
-    name: "bottleneck3_1/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_1/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_1/dim_red/conv"
-  top: "bottleneck3_1/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_1/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_1/dim_red/conv"
-  top: "bottleneck3_1/dim_red/conv"
-  param {
-    name: "bottleneck3_1/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_1/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_1/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_1/dim_red/conv"
-  top: "bottleneck3_1/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_1/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_1/dim_red/conv"
-  top: "bottleneck3_1/inner/dw1/conv"
-  param {
-    name: "bottleneck3_1/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_1/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_1/inner/dw1/conv"
-  top: "bottleneck3_1/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_1/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_1/inner/dw1/conv"
-  top: "bottleneck3_1/inner/dw1/conv"
-  param {
-    name: "bottleneck3_1/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_1/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_1/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_1/inner/dw1/conv"
-  top: "bottleneck3_1/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_1/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_1/inner/dw1/conv"
-  top: "bottleneck3_1/dim_inc/conv"
-  param {
-    name: "bottleneck3_1/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_1/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_1/dim_inc/conv"
-  top: "bottleneck3_1/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_1/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_1/dim_inc/conv"
-  top: "bottleneck3_1/dim_inc/conv"
-  param {
-    name: "bottleneck3_1/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_1/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_1/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_0/add"
-  bottom: "bottleneck3_1/dim_inc/conv"
-  top: "bottleneck3_1/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_1/add"
-  top: "bottleneck3_1/add"
-}
-layer {
-  name: "bottleneck3_2/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_1/add"
-  top: "bottleneck3_2/dim_red/conv"
-  param {
-    name: "bottleneck3_2/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_2/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_2/dim_red/conv"
-  top: "bottleneck3_2/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_2/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_2/dim_red/conv"
-  top: "bottleneck3_2/dim_red/conv"
-  param {
-    name: "bottleneck3_2/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_2/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_2/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_2/dim_red/conv"
-  top: "bottleneck3_2/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_2/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_2/dim_red/conv"
-  top: "bottleneck3_2/inner/dw1/conv"
-  param {
-    name: "bottleneck3_2/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_2/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_2/inner/dw1/conv"
-  top: "bottleneck3_2/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_2/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_2/inner/dw1/conv"
-  top: "bottleneck3_2/inner/dw1/conv"
-  param {
-    name: "bottleneck3_2/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_2/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_2/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_2/inner/dw1/conv"
-  top: "bottleneck3_2/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_2/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_2/inner/dw1/conv"
-  top: "bottleneck3_2/dim_inc/conv"
-  param {
-    name: "bottleneck3_2/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_2/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_2/dim_inc/conv"
-  top: "bottleneck3_2/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_2/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_2/dim_inc/conv"
-  top: "bottleneck3_2/dim_inc/conv"
-  param {
-    name: "bottleneck3_2/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_2/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_2/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_1/add"
-  bottom: "bottleneck3_2/dim_inc/conv"
-  top: "bottleneck3_2/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_2/fn"
-  type: "ELU"
-  bottom: "bottleneck3_2/add"
-  top: "bottleneck3_2/add"
-}
-layer {
-  name: "bottleneck3_3/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_2/add"
-  top: "bottleneck3_3/dim_red/conv"
-  param {
-    name: "bottleneck3_3/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_3/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_3/dim_red/conv"
-  top: "bottleneck3_3/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_3/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_3/dim_red/conv"
-  top: "bottleneck3_3/dim_red/conv"
-  param {
-    name: "bottleneck3_3/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_3/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_3/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_3/dim_red/conv"
-  top: "bottleneck3_3/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_3/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_3/dim_red/conv"
-  top: "bottleneck3_3/inner/dw1/conv"
-  param {
-    name: "bottleneck3_3/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_3/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_3/inner/dw1/conv"
-  top: "bottleneck3_3/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_3/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_3/inner/dw1/conv"
-  top: "bottleneck3_3/inner/dw1/conv"
-  param {
-    name: "bottleneck3_3/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_3/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_3/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_3/inner/dw1/conv"
-  top: "bottleneck3_3/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_3/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_3/inner/dw1/conv"
-  top: "bottleneck3_3/dim_inc/conv"
-  param {
-    name: "bottleneck3_3/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_3/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_3/dim_inc/conv"
-  top: "bottleneck3_3/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_3/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_3/dim_inc/conv"
-  top: "bottleneck3_3/dim_inc/conv"
-  param {
-    name: "bottleneck3_3/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_3/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_3/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_2/add"
-  bottom: "bottleneck3_3/dim_inc/conv"
-  top: "bottleneck3_3/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_3/fn"
-  type: "ELU"
-  bottom: "bottleneck3_3/add"
-  top: "bottleneck3_3/add"
-}
-layer {
-  name: "bottleneck3_4/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_3/add"
-  top: "bottleneck3_4/dim_red/conv"
-  param {
-    name: "bottleneck3_4/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_4/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_4/dim_red/conv"
-  top: "bottleneck3_4/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_4/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_4/dim_red/conv"
-  top: "bottleneck3_4/dim_red/conv"
-  param {
-    name: "bottleneck3_4/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_4/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_4/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_4/dim_red/conv"
-  top: "bottleneck3_4/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_4/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_4/dim_red/conv"
-  top: "bottleneck3_4/inner/dw1/conv"
-  param {
-    name: "bottleneck3_4/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_4/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_4/inner/dw1/conv"
-  top: "bottleneck3_4/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_4/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_4/inner/dw1/conv"
-  top: "bottleneck3_4/inner/dw1/conv"
-  param {
-    name: "bottleneck3_4/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_4/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_4/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_4/inner/dw1/conv"
-  top: "bottleneck3_4/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_4/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_4/inner/dw1/conv"
-  top: "bottleneck3_4/dim_inc/conv"
-  param {
-    name: "bottleneck3_4/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_4/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_4/dim_inc/conv"
-  top: "bottleneck3_4/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_4/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_4/dim_inc/conv"
-  top: "bottleneck3_4/dim_inc/conv"
-  param {
-    name: "bottleneck3_4/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_4/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_4/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_3/add"
-  bottom: "bottleneck3_4/dim_inc/conv"
-  top: "bottleneck3_4/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_4/fn"
-  type: "ELU"
-  bottom: "bottleneck3_4/add"
-  top: "bottleneck3_4/add"
-}
-layer {
-  name: "bottleneck3_5/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_4/add"
-  top: "bottleneck3_5/dim_red/conv"
-  param {
-    name: "bottleneck3_5/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_5/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_5/dim_red/conv"
-  top: "bottleneck3_5/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_5/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_5/dim_red/conv"
-  top: "bottleneck3_5/dim_red/conv"
-  param {
-    name: "bottleneck3_5/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_5/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_5/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_5/dim_red/conv"
-  top: "bottleneck3_5/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_5/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_5/dim_red/conv"
-  top: "bottleneck3_5/inner/dw1/conv"
-  param {
-    name: "bottleneck3_5/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_5/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_5/inner/dw1/conv"
-  top: "bottleneck3_5/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_5/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_5/inner/dw1/conv"
-  top: "bottleneck3_5/inner/dw1/conv"
-  param {
-    name: "bottleneck3_5/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_5/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_5/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_5/inner/dw1/conv"
-  top: "bottleneck3_5/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_5/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_5/inner/dw1/conv"
-  top: "bottleneck3_5/dim_inc/conv"
-  param {
-    name: "bottleneck3_5/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_5/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_5/dim_inc/conv"
-  top: "bottleneck3_5/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_5/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_5/dim_inc/conv"
-  top: "bottleneck3_5/dim_inc/conv"
-  param {
-    name: "bottleneck3_5/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_5/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_5/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_4/add"
-  bottom: "bottleneck3_5/dim_inc/conv"
-  top: "bottleneck3_5/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_5/fn"
-  type: "ELU"
-  bottom: "bottleneck3_5/add"
-  top: "bottleneck3_5/add"
-}
-layer {
-  name: "bottleneck3_6/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_5/add"
-  top: "bottleneck3_6/dim_red/conv"
-  param {
-    name: "bottleneck3_6/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_6/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_6/dim_red/conv"
-  top: "bottleneck3_6/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_6/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_6/dim_red/conv"
-  top: "bottleneck3_6/dim_red/conv"
-  param {
-    name: "bottleneck3_6/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_6/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_6/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_6/dim_red/conv"
-  top: "bottleneck3_6/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_6/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_6/dim_red/conv"
-  top: "bottleneck3_6/inner/dw1/conv"
-  param {
-    name: "bottleneck3_6/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_6/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_6/inner/dw1/conv"
-  top: "bottleneck3_6/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_6/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_6/inner/dw1/conv"
-  top: "bottleneck3_6/inner/dw1/conv"
-  param {
-    name: "bottleneck3_6/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_6/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_6/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_6/inner/dw1/conv"
-  top: "bottleneck3_6/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_6/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_6/inner/dw1/conv"
-  top: "bottleneck3_6/dim_inc/conv"
-  param {
-    name: "bottleneck3_6/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_6/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_6/dim_inc/conv"
-  top: "bottleneck3_6/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_6/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_6/dim_inc/conv"
-  top: "bottleneck3_6/dim_inc/conv"
-  param {
-    name: "bottleneck3_6/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_6/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_6/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_5/add"
-  bottom: "bottleneck3_6/dim_inc/conv"
-  top: "bottleneck3_6/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_6/fn"
-  type: "ELU"
-  bottom: "bottleneck3_6/add"
-  top: "bottleneck3_6/add"
-}
-layer {
-  name: "bottleneck3_7/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_6/add"
-  top: "bottleneck3_7/dim_red/conv"
-  param {
-    name: "bottleneck3_7/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_7/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_7/dim_red/conv"
-  top: "bottleneck3_7/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_7/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_7/dim_red/conv"
-  top: "bottleneck3_7/dim_red/conv"
-  param {
-    name: "bottleneck3_7/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_7/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_7/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_7/dim_red/conv"
-  top: "bottleneck3_7/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_7/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_7/dim_red/conv"
-  top: "bottleneck3_7/inner/dw1/conv"
-  param {
-    name: "bottleneck3_7/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_7/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_7/inner/dw1/conv"
-  top: "bottleneck3_7/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_7/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_7/inner/dw1/conv"
-  top: "bottleneck3_7/inner/dw1/conv"
-  param {
-    name: "bottleneck3_7/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_7/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_7/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_7/inner/dw1/conv"
-  top: "bottleneck3_7/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_7/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_7/inner/dw1/conv"
-  top: "bottleneck3_7/dim_inc/conv"
-  param {
-    name: "bottleneck3_7/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_7/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_7/dim_inc/conv"
-  top: "bottleneck3_7/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_7/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_7/dim_inc/conv"
-  top: "bottleneck3_7/dim_inc/conv"
-  param {
-    name: "bottleneck3_7/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_7/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_7/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_6/add"
-  bottom: "bottleneck3_7/dim_inc/conv"
-  top: "bottleneck3_7/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_7/fn"
-  type: "ELU"
-  bottom: "bottleneck3_7/add"
-  top: "bottleneck3_7/add"
-}
-layer {
-  name: "bottleneck3_8/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_7/add"
-  top: "bottleneck3_8/dim_red/conv"
-  param {
-    name: "bottleneck3_8/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_8/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_8/dim_red/conv"
-  top: "bottleneck3_8/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_8/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_8/dim_red/conv"
-  top: "bottleneck3_8/dim_red/conv"
-  param {
-    name: "bottleneck3_8/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_8/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_8/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_8/dim_red/conv"
-  top: "bottleneck3_8/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_8/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_8/dim_red/conv"
-  top: "bottleneck3_8/inner/dw1/conv"
-  param {
-    name: "bottleneck3_8/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_8/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_8/inner/dw1/conv"
-  top: "bottleneck3_8/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_8/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_8/inner/dw1/conv"
-  top: "bottleneck3_8/inner/dw1/conv"
-  param {
-    name: "bottleneck3_8/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_8/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_8/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_8/inner/dw1/conv"
-  top: "bottleneck3_8/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_8/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_8/inner/dw1/conv"
-  top: "bottleneck3_8/dim_inc/conv"
-  param {
-    name: "bottleneck3_8/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_8/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_8/dim_inc/conv"
-  top: "bottleneck3_8/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_8/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_8/dim_inc/conv"
-  top: "bottleneck3_8/dim_inc/conv"
-  param {
-    name: "bottleneck3_8/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_8/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_8/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_7/add"
-  bottom: "bottleneck3_8/dim_inc/conv"
-  top: "bottleneck3_8/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_8/fn"
-  type: "ELU"
-  bottom: "bottleneck3_8/add"
-  top: "bottleneck3_8/add"
-}
-layer {
-  name: "bottleneck3_9/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_8/add"
-  top: "bottleneck3_9/dim_red/conv"
-  param {
-    name: "bottleneck3_9/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_9/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_9/dim_red/conv"
-  top: "bottleneck3_9/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_9/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_9/dim_red/conv"
-  top: "bottleneck3_9/dim_red/conv"
-  param {
-    name: "bottleneck3_9/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_9/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_9/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_9/dim_red/conv"
-  top: "bottleneck3_9/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_9/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_9/dim_red/conv"
-  top: "bottleneck3_9/inner/dw1/conv"
-  param {
-    name: "bottleneck3_9/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_9/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_9/inner/dw1/conv"
-  top: "bottleneck3_9/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_9/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_9/inner/dw1/conv"
-  top: "bottleneck3_9/inner/dw1/conv"
-  param {
-    name: "bottleneck3_9/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_9/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_9/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_9/inner/dw1/conv"
-  top: "bottleneck3_9/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_9/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_9/inner/dw1/conv"
-  top: "bottleneck3_9/dim_inc/conv"
-  param {
-    name: "bottleneck3_9/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_9/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_9/dim_inc/conv"
-  top: "bottleneck3_9/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_9/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_9/dim_inc/conv"
-  top: "bottleneck3_9/dim_inc/conv"
-  param {
-    name: "bottleneck3_9/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_9/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_9/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_8/add"
-  bottom: "bottleneck3_9/dim_inc/conv"
-  top: "bottleneck3_9/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_9/fn"
-  type: "ELU"
-  bottom: "bottleneck3_9/add"
-  top: "bottleneck3_9/add"
-}
-layer {
-  name: "bottleneck3_10/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_9/add"
-  top: "bottleneck3_10/dim_red/conv"
-  param {
-    name: "bottleneck3_10/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_10/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_10/dim_red/conv"
-  top: "bottleneck3_10/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_10/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_10/dim_red/conv"
-  top: "bottleneck3_10/dim_red/conv"
-  param {
-    name: "bottleneck3_10/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_10/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_10/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_10/dim_red/conv"
-  top: "bottleneck3_10/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_10/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_10/dim_red/conv"
-  top: "bottleneck3_10/inner/dw1/conv"
-  param {
-    name: "bottleneck3_10/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_10/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_10/inner/dw1/conv"
-  top: "bottleneck3_10/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_10/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_10/inner/dw1/conv"
-  top: "bottleneck3_10/inner/dw1/conv"
-  param {
-    name: "bottleneck3_10/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_10/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_10/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_10/inner/dw1/conv"
-  top: "bottleneck3_10/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_10/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_10/inner/dw1/conv"
-  top: "bottleneck3_10/dim_inc/conv"
-  param {
-    name: "bottleneck3_10/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_10/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_10/dim_inc/conv"
-  top: "bottleneck3_10/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_10/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_10/dim_inc/conv"
-  top: "bottleneck3_10/dim_inc/conv"
-  param {
-    name: "bottleneck3_10/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_10/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_10/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_9/add"
-  bottom: "bottleneck3_10/dim_inc/conv"
-  top: "bottleneck3_10/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_10/fn"
-  type: "ELU"
-  bottom: "bottleneck3_10/add"
-  top: "bottleneck3_10/add"
-}
-layer {
-  name: "bottleneck4_0/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_10/add"
-  top: "bottleneck4_0/dim_red/conv"
-  param {
-    name: "bottleneck4_0/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_0/dim_red/conv"
-  top: "bottleneck4_0/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_0/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_0/dim_red/conv"
-  top: "bottleneck4_0/dim_red/conv"
-  param {
-    name: "bottleneck4_0/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_0/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_0/dim_red/conv"
-  top: "bottleneck4_0/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_0/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_0/dim_red/conv"
-  top: "bottleneck4_0/inner/dw1/conv"
-  param {
-    name: "bottleneck4_0/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 2
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_0/inner/dw1/conv"
-  top: "bottleneck4_0/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_0/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_0/inner/dw1/conv"
-  top: "bottleneck4_0/inner/dw1/conv"
-  param {
-    name: "bottleneck4_0/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_0/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_0/inner/dw1/conv"
-  top: "bottleneck4_0/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_0/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_0/inner/dw1/conv"
-  top: "bottleneck4_0/dim_inc/conv"
-  param {
-    name: "bottleneck4_0/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_0/dim_inc/conv"
-  top: "bottleneck4_0/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_0/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_0/dim_inc/conv"
-  top: "bottleneck4_0/dim_inc/conv"
-  param {
-    name: "bottleneck4_0/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_0/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/skip/pooling"
-  type: "Pooling"
-  bottom: "bottleneck3_10/add"
-  top: "bottleneck4_0/skip/pooling"
-  pooling_param {
-    pool: MAX
-    kernel_size: 2
-    stride: 2
-    pad: 0
-  }
-}
-layer {
-  name: "bottleneck4_0/skip/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_0/skip/pooling"
-  top: "bottleneck4_0/skip/conv"
-  param {
-    name: "bottleneck4_0/skip/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/skip/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_0/skip/conv"
-  top: "bottleneck4_0/skip/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_0/skip/scale"
-  type: "Scale"
-  bottom: "bottleneck4_0/skip/conv"
-  top: "bottleneck4_0/skip/conv"
-  param {
-    name: "bottleneck4_0/skip/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_0/skip/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_0/skip/conv"
-  bottom: "bottleneck4_0/dim_inc/conv"
-  top: "bottleneck4_0/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_0/fn"
-  type: "ELU"
-  bottom: "bottleneck4_0/add"
-  top: "bottleneck4_0/add"
-}
-layer {
-  name: "bottleneck4_1/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_0/add"
-  top: "bottleneck4_1/dim_red/conv"
-  param {
-    name: "bottleneck4_1/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_1/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_1/dim_red/conv"
-  top: "bottleneck4_1/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_1/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_1/dim_red/conv"
-  top: "bottleneck4_1/dim_red/conv"
-  param {
-    name: "bottleneck4_1/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_1/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_1/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_1/dim_red/conv"
-  top: "bottleneck4_1/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_1/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_1/dim_red/conv"
-  top: "bottleneck4_1/inner/dw1/conv"
-  param {
-    name: "bottleneck4_1/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_1/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_1/inner/dw1/conv"
-  top: "bottleneck4_1/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_1/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_1/inner/dw1/conv"
-  top: "bottleneck4_1/inner/dw1/conv"
-  param {
-    name: "bottleneck4_1/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_1/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_1/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_1/inner/dw1/conv"
-  top: "bottleneck4_1/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_1/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_1/inner/dw1/conv"
-  top: "bottleneck4_1/dim_inc/conv"
-  param {
-    name: "bottleneck4_1/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_1/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_1/dim_inc/conv"
-  top: "bottleneck4_1/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_1/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_1/dim_inc/conv"
-  top: "bottleneck4_1/dim_inc/conv"
-  param {
-    name: "bottleneck4_1/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_1/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_1/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_0/add"
-  bottom: "bottleneck4_1/dim_inc/conv"
-  top: "bottleneck4_1/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_1/add"
-  top: "bottleneck4_1/add"
-}
-layer {
-  name: "bottleneck4_2/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_1/add"
-  top: "bottleneck4_2/dim_red/conv"
-  param {
-    name: "bottleneck4_2/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_2/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_2/dim_red/conv"
-  top: "bottleneck4_2/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_2/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_2/dim_red/conv"
-  top: "bottleneck4_2/dim_red/conv"
-  param {
-    name: "bottleneck4_2/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_2/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_2/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_2/dim_red/conv"
-  top: "bottleneck4_2/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_2/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_2/dim_red/conv"
-  top: "bottleneck4_2/inner/dw1/conv"
-  param {
-    name: "bottleneck4_2/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_2/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_2/inner/dw1/conv"
-  top: "bottleneck4_2/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_2/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_2/inner/dw1/conv"
-  top: "bottleneck4_2/inner/dw1/conv"
-  param {
-    name: "bottleneck4_2/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_2/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_2/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_2/inner/dw1/conv"
-  top: "bottleneck4_2/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_2/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_2/inner/dw1/conv"
-  top: "bottleneck4_2/dim_inc/conv"
-  param {
-    name: "bottleneck4_2/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_2/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_2/dim_inc/conv"
-  top: "bottleneck4_2/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_2/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_2/dim_inc/conv"
-  top: "bottleneck4_2/dim_inc/conv"
-  param {
-    name: "bottleneck4_2/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_2/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_2/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_1/add"
-  bottom: "bottleneck4_2/dim_inc/conv"
-  top: "bottleneck4_2/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_2/fn"
-  type: "ELU"
-  bottom: "bottleneck4_2/add"
-  top: "bottleneck4_2/add"
-}
-layer {
-  name: "bottleneck4_3/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_2/add"
-  top: "bottleneck4_3/dim_red/conv"
-  param {
-    name: "bottleneck4_3/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_3/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_3/dim_red/conv"
-  top: "bottleneck4_3/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_3/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_3/dim_red/conv"
-  top: "bottleneck4_3/dim_red/conv"
-  param {
-    name: "bottleneck4_3/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_3/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_3/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_3/dim_red/conv"
-  top: "bottleneck4_3/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_3/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_3/dim_red/conv"
-  top: "bottleneck4_3/inner/dw1/conv"
-  param {
-    name: "bottleneck4_3/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_3/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_3/inner/dw1/conv"
-  top: "bottleneck4_3/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_3/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_3/inner/dw1/conv"
-  top: "bottleneck4_3/inner/dw1/conv"
-  param {
-    name: "bottleneck4_3/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_3/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_3/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_3/inner/dw1/conv"
-  top: "bottleneck4_3/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_3/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_3/inner/dw1/conv"
-  top: "bottleneck4_3/dim_inc/conv"
-  param {
-    name: "bottleneck4_3/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_3/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_3/dim_inc/conv"
-  top: "bottleneck4_3/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_3/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_3/dim_inc/conv"
-  top: "bottleneck4_3/dim_inc/conv"
-  param {
-    name: "bottleneck4_3/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_3/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_3/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_2/add"
-  bottom: "bottleneck4_3/dim_inc/conv"
-  top: "bottleneck4_3/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_3/fn"
-  type: "ELU"
-  bottom: "bottleneck4_3/add"
-  top: "bottleneck4_3/add"
-}
-layer {
-  name: "bottleneck4_4/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_3/add"
-  top: "bottleneck4_4/dim_red/conv"
-  param {
-    name: "bottleneck4_4/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_4/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_4/dim_red/conv"
-  top: "bottleneck4_4/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_4/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_4/dim_red/conv"
-  top: "bottleneck4_4/dim_red/conv"
-  param {
-    name: "bottleneck4_4/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_4/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_4/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_4/dim_red/conv"
-  top: "bottleneck4_4/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_4/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_4/dim_red/conv"
-  top: "bottleneck4_4/inner/dw1/conv"
-  param {
-    name: "bottleneck4_4/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_4/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_4/inner/dw1/conv"
-  top: "bottleneck4_4/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_4/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_4/inner/dw1/conv"
-  top: "bottleneck4_4/inner/dw1/conv"
-  param {
-    name: "bottleneck4_4/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_4/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_4/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_4/inner/dw1/conv"
-  top: "bottleneck4_4/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_4/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_4/inner/dw1/conv"
-  top: "bottleneck4_4/dim_inc/conv"
-  param {
-    name: "bottleneck4_4/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_4/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_4/dim_inc/conv"
-  top: "bottleneck4_4/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_4/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_4/dim_inc/conv"
-  top: "bottleneck4_4/dim_inc/conv"
-  param {
-    name: "bottleneck4_4/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_4/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_4/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_3/add"
-  bottom: "bottleneck4_4/dim_inc/conv"
-  top: "bottleneck4_4/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_4/fn"
-  type: "ELU"
-  bottom: "bottleneck4_4/add"
-  top: "bottleneck4_4/add"
-}
-layer {
-  name: "bottleneck4_5/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_4/add"
-  top: "bottleneck4_5/dim_red/conv"
-  param {
-    name: "bottleneck4_5/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_5/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_5/dim_red/conv"
-  top: "bottleneck4_5/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_5/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_5/dim_red/conv"
-  top: "bottleneck4_5/dim_red/conv"
-  param {
-    name: "bottleneck4_5/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_5/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_5/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_5/dim_red/conv"
-  top: "bottleneck4_5/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_5/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_5/dim_red/conv"
-  top: "bottleneck4_5/inner/dw1/conv"
-  param {
-    name: "bottleneck4_5/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_5/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_5/inner/dw1/conv"
-  top: "bottleneck4_5/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_5/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_5/inner/dw1/conv"
-  top: "bottleneck4_5/inner/dw1/conv"
-  param {
-    name: "bottleneck4_5/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_5/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_5/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_5/inner/dw1/conv"
-  top: "bottleneck4_5/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_5/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_5/inner/dw1/conv"
-  top: "bottleneck4_5/dim_inc/conv"
-  param {
-    name: "bottleneck4_5/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_5/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_5/dim_inc/conv"
-  top: "bottleneck4_5/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_5/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_5/dim_inc/conv"
-  top: "bottleneck4_5/dim_inc/conv"
-  param {
-    name: "bottleneck4_5/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_5/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_5/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_4/add"
-  bottom: "bottleneck4_5/dim_inc/conv"
-  top: "bottleneck4_5/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_5/fn"
-  type: "ELU"
-  bottom: "bottleneck4_5/add"
-  top: "bottleneck4_5/add"
-}
-layer {
-  name: "bottleneck4_6/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_5/add"
-  top: "bottleneck4_6/dim_red/conv"
-  param {
-    name: "bottleneck4_6/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_6/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_6/dim_red/conv"
-  top: "bottleneck4_6/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_6/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_6/dim_red/conv"
-  top: "bottleneck4_6/dim_red/conv"
-  param {
-    name: "bottleneck4_6/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_6/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_6/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_6/dim_red/conv"
-  top: "bottleneck4_6/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_6/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_6/dim_red/conv"
-  top: "bottleneck4_6/inner/dw1/conv"
-  param {
-    name: "bottleneck4_6/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_6/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_6/inner/dw1/conv"
-  top: "bottleneck4_6/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_6/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_6/inner/dw1/conv"
-  top: "bottleneck4_6/inner/dw1/conv"
-  param {
-    name: "bottleneck4_6/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_6/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_6/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_6/inner/dw1/conv"
-  top: "bottleneck4_6/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_6/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_6/inner/dw1/conv"
-  top: "bottleneck4_6/dim_inc/conv"
-  param {
-    name: "bottleneck4_6/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_6/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_6/dim_inc/conv"
-  top: "bottleneck4_6/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_6/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_6/dim_inc/conv"
-  top: "bottleneck4_6/dim_inc/conv"
-  param {
-    name: "bottleneck4_6/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_6/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_6/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_5/add"
-  bottom: "bottleneck4_6/dim_inc/conv"
-  top: "bottleneck4_6/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_6/fn"
-  type: "ELU"
-  bottom: "bottleneck4_6/add"
-  top: "bottleneck4_6/add"
-}
-layer {
-  name: "bottleneck4_7/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_6/add"
-  top: "bottleneck4_7/dim_red/conv"
-  param {
-    name: "bottleneck4_7/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_7/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_7/dim_red/conv"
-  top: "bottleneck4_7/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_7/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_7/dim_red/conv"
-  top: "bottleneck4_7/dim_red/conv"
-  param {
-    name: "bottleneck4_7/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_7/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_7/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_7/dim_red/conv"
-  top: "bottleneck4_7/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_7/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_7/dim_red/conv"
-  top: "bottleneck4_7/inner/dw1/conv"
-  param {
-    name: "bottleneck4_7/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_7/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_7/inner/dw1/conv"
-  top: "bottleneck4_7/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_7/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_7/inner/dw1/conv"
-  top: "bottleneck4_7/inner/dw1/conv"
-  param {
-    name: "bottleneck4_7/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_7/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_7/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_7/inner/dw1/conv"
-  top: "bottleneck4_7/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_7/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_7/inner/dw1/conv"
-  top: "bottleneck4_7/dim_inc/conv"
-  param {
-    name: "bottleneck4_7/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_7/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_7/dim_inc/conv"
-  top: "bottleneck4_7/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_7/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_7/dim_inc/conv"
-  top: "bottleneck4_7/dim_inc/conv"
-  param {
-    name: "bottleneck4_7/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_7/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_7/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_6/add"
-  bottom: "bottleneck4_7/dim_inc/conv"
-  top: "bottleneck4_7/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_7/fn"
-  type: "ELU"
-  bottom: "bottleneck4_7/add"
-  top: "bottleneck4_7/add"
-}
-layer {
-  name: "bottleneck4_8/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_7/add"
-  top: "bottleneck4_8/dim_red/conv"
-  param {
-    name: "bottleneck4_8/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_8/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_8/dim_red/conv"
-  top: "bottleneck4_8/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_8/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_8/dim_red/conv"
-  top: "bottleneck4_8/dim_red/conv"
-  param {
-    name: "bottleneck4_8/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_8/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_8/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_8/dim_red/conv"
-  top: "bottleneck4_8/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_8/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_8/dim_red/conv"
-  top: "bottleneck4_8/inner/dw1/conv"
-  param {
-    name: "bottleneck4_8/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_8/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_8/inner/dw1/conv"
-  top: "bottleneck4_8/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_8/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_8/inner/dw1/conv"
-  top: "bottleneck4_8/inner/dw1/conv"
-  param {
-    name: "bottleneck4_8/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_8/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_8/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_8/inner/dw1/conv"
-  top: "bottleneck4_8/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_8/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_8/inner/dw1/conv"
-  top: "bottleneck4_8/dim_inc/conv"
-  param {
-    name: "bottleneck4_8/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_8/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_8/dim_inc/conv"
-  top: "bottleneck4_8/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_8/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_8/dim_inc/conv"
-  top: "bottleneck4_8/dim_inc/conv"
-  param {
-    name: "bottleneck4_8/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_8/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_8/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_7/add"
-  bottom: "bottleneck4_8/dim_inc/conv"
-  top: "bottleneck4_8/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_8/fn"
-  type: "ELU"
-  bottom: "bottleneck4_8/add"
-  top: "bottleneck4_8/add"
-}
-layer {
-  name: "bottleneck4_9/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_8/add"
-  top: "bottleneck4_9/dim_red/conv"
-  param {
-    name: "bottleneck4_9/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_9/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_9/dim_red/conv"
-  top: "bottleneck4_9/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_9/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_9/dim_red/conv"
-  top: "bottleneck4_9/dim_red/conv"
-  param {
-    name: "bottleneck4_9/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_9/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_9/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_9/dim_red/conv"
-  top: "bottleneck4_9/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_9/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_9/dim_red/conv"
-  top: "bottleneck4_9/inner/dw1/conv"
-  param {
-    name: "bottleneck4_9/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_9/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_9/inner/dw1/conv"
-  top: "bottleneck4_9/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_9/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_9/inner/dw1/conv"
-  top: "bottleneck4_9/inner/dw1/conv"
-  param {
-    name: "bottleneck4_9/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_9/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_9/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_9/inner/dw1/conv"
-  top: "bottleneck4_9/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_9/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_9/inner/dw1/conv"
-  top: "bottleneck4_9/dim_inc/conv"
-  param {
-    name: "bottleneck4_9/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_9/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_9/dim_inc/conv"
-  top: "bottleneck4_9/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_9/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_9/dim_inc/conv"
-  top: "bottleneck4_9/dim_inc/conv"
-  param {
-    name: "bottleneck4_9/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_9/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_9/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_8/add"
-  bottom: "bottleneck4_9/dim_inc/conv"
-  top: "bottleneck4_9/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_9/fn"
-  type: "ELU"
-  bottom: "bottleneck4_9/add"
-  top: "bottleneck4_9/add"
-}
-layer {
-  name: "bottleneck4_10/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_9/add"
-  top: "bottleneck4_10/dim_red/conv"
-  param {
-    name: "bottleneck4_10/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_10/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_10/dim_red/conv"
-  top: "bottleneck4_10/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_10/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_10/dim_red/conv"
-  top: "bottleneck4_10/dim_red/conv"
-  param {
-    name: "bottleneck4_10/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_10/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_10/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_10/dim_red/conv"
-  top: "bottleneck4_10/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_10/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_10/dim_red/conv"
-  top: "bottleneck4_10/inner/dw1/conv"
-  param {
-    name: "bottleneck4_10/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_10/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_10/inner/dw1/conv"
-  top: "bottleneck4_10/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_10/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_10/inner/dw1/conv"
-  top: "bottleneck4_10/inner/dw1/conv"
-  param {
-    name: "bottleneck4_10/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_10/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_10/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_10/inner/dw1/conv"
-  top: "bottleneck4_10/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_10/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_10/inner/dw1/conv"
-  top: "bottleneck4_10/dim_inc/conv"
-  param {
-    name: "bottleneck4_10/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_10/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_10/dim_inc/conv"
-  top: "bottleneck4_10/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_10/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_10/dim_inc/conv"
-  top: "bottleneck4_10/dim_inc/conv"
-  param {
-    name: "bottleneck4_10/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_10/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_10/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_9/add"
-  bottom: "bottleneck4_10/dim_inc/conv"
-  top: "bottleneck4_10/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_10/fn"
-  type: "ELU"
-  bottom: "bottleneck4_10/add"
-  top: "bottleneck4_10/add"
-}
-layer {
-  name: "bottleneck4_11/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_10/add"
-  top: "bottleneck4_11/dim_red/conv"
-  param {
-    name: "bottleneck4_11/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_11/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_11/dim_red/conv"
-  top: "bottleneck4_11/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_11/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_11/dim_red/conv"
-  top: "bottleneck4_11/dim_red/conv"
-  param {
-    name: "bottleneck4_11/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_11/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_11/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_11/dim_red/conv"
-  top: "bottleneck4_11/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_11/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_11/dim_red/conv"
-  top: "bottleneck4_11/inner/dw1/conv"
-  param {
-    name: "bottleneck4_11/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_11/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_11/inner/dw1/conv"
-  top: "bottleneck4_11/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_11/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_11/inner/dw1/conv"
-  top: "bottleneck4_11/inner/dw1/conv"
-  param {
-    name: "bottleneck4_11/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_11/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_11/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_11/inner/dw1/conv"
-  top: "bottleneck4_11/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_11/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_11/inner/dw1/conv"
-  top: "bottleneck4_11/dim_inc/conv"
-  param {
-    name: "bottleneck4_11/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_11/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_11/dim_inc/conv"
-  top: "bottleneck4_11/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_11/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_11/dim_inc/conv"
-  top: "bottleneck4_11/dim_inc/conv"
-  param {
-    name: "bottleneck4_11/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_11/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_11/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_10/add"
-  bottom: "bottleneck4_11/dim_inc/conv"
-  top: "bottleneck4_11/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_11/fn"
-  type: "ELU"
-  bottom: "bottleneck4_11/add"
-  top: "bottleneck4_11/add"
-}
-
-###################################################
-################# Embedding Head ##################
-###################################################
-
-layer {
-  name: "pooling/out"
-  type: "Pooling"
-  bottom: "bottleneck4_11/add"
-  top: "pooling/out"
-  pooling_param {
-    pool: MAX
-    global_pooling: true
-  }
-}
-layer {
-  name: "embd/dim_inc/conv"
-  type: "Convolution"
-  bottom: "pooling/out"
-  top: "embd/dim_inc/conv"
-  param {
-    lr_mult: 1.0
-    decay_mult: 1.0
-  }
-  convolution_param {
-    num_output: 512
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "embd/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "embd/dim_inc/conv"
-  top: "embd/dim_inc/conv"
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-}
-layer {
-  name: "embd/dim_inc/scale"
-  type: "Scale"
-  bottom: "embd/dim_inc/conv"
-  top: "embd/dim_inc/conv"
-  param {
-    lr_mult: 1.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 2.0
-    decay_mult: 0.0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1.0
-    }
-    bias_term: true
-    bias_filler {
-      value: 0.0
-    }
-  }
-}
-layer {
-  name: "embd/dim_inc/fn"
-  type: "ELU"
-  bottom: "embd/dim_inc/conv"
-  top: "embd/dim_inc/conv"
-}
-
-layer {
-  name: "embd/dim_red/conv"
-  type: "Convolution"
-  bottom: "embd/dim_inc/conv"
-  top: "embd/dim_red/conv"
-  param {
-    lr_mult: 1.0
-    decay_mult: 1.0
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "embd/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "embd/dim_red/conv"
-  top: "embd/dim_red/conv"
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-}
-layer {
-  name: "embd/dim_red/scale"
-  type: "Scale"
-  bottom: "embd/dim_red/conv"
-  top: "embd/dim_red/conv"
-  param {
-    lr_mult: 1.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 2.0
-    decay_mult: 0.0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1.0
-    }
-    bias_term: true
-    bias_filler {
-      value: 0.0
-    }
-  }
-}
-
diff --git a/models/intel/person-reidentification-retail-0079/description/person-reidentification-retail-0079.md b/models/intel/person-reidentification-retail-0079/description/person-reidentification-retail-0079.md
deleted file mode 100644
index 9224101cc1b..00000000000
--- a/models/intel/person-reidentification-retail-0079/description/person-reidentification-retail-0079.md
+++ /dev/null
@@ -1,45 +0,0 @@
-# person-reidentification-retail-0079
-
-## Use Case and High-Level Description
-
-This is a person reidentification model for a general scenario. It uses a whole body image as an input and outputs an embedding vector to match a pair of images by the Cosine distance. The model is based on RMNet backbone that was developed for fast inference. A single reidentification head from the 1/16 scale feature map outputs the embedding vector of 256 floats. The model is provided without last calibration layer, but can be used in the same way as the original model (with insignificant drop in accuracy).
-
-## Example
-
-![](./person-reidentification-retail-0079.png)
-
-## Specification
-
-| Metric                            | Value                                     |
-|-----------------------------------|-------------------------------------------|
-| Market-1501 rank@1 accuracy       | 0.9166                                    |
-| Market-1501 mAP                   | 0.8163                                    |
-| Pose coverage                     | Standing upright, parallel to image plane |
-| Support of occluded pedestrians   | YES                                       |
-| Occlusion coverage                | <50%                                      |
-| GFlops                            | 0.124                                     |
-| MParams                           | 0.820                                     |
-| Source framework                  | Caffe*                                    |
-
-The cumulative matching curve (CMC) at rank-1 is accuracy denoting the possibility to locate at least one true positive in the top-1 rank.
-Mean Average Precision (mAP) is the mean across all queries’ Average Precision (AP) and AP is defined as an area under the [precision/recall](https://en.wikipedia.org/wiki/Precision_and_recall) curve.
-
-## Performance
-
-## Inputs
-
-1. name: "data" , shape: [1x3x160x64] - An input image in the format [BxCxHxW],
-   where:
-    - B - batch size
-    - C - number of channels
-    - H - image height
-    - W - image width
-
-   The expected color order is BGR.
-
-## Outputs
-
-1. The net outputs a blob with shape: [1, 256, 1, 1] named descriptor, which can be compared with other descriptors using the [Cosine distance](https://en.wikipedia.org/wiki/Cosine_similarity).
-
-## Legal Information
-[*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/person-reidentification-retail-0079/description/person-reidentification-retail-0079.png b/models/intel/person-reidentification-retail-0079/description/person-reidentification-retail-0079.png
deleted file mode 100644
index 3bff7952dbe..00000000000
Binary files a/models/intel/person-reidentification-retail-0079/description/person-reidentification-retail-0079.png and /dev/null differ
diff --git a/models/intel/person-reidentification-retail-0079/model.yml b/models/intel/person-reidentification-retail-0079/model.yml
deleted file mode 100644
index 7bb38764828..00000000000
--- a/models/intel/person-reidentification-retail-0079/model.yml
+++ /dev/null
@@ -1,50 +0,0 @@
-# Copyright (c) 2019 Intel Corporation
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-description: >-
-  This is a person reidentification model for a general scenario. It uses a whole
-  body image as an input and outputs an embedding vector to match a pair of images
-  by the Cosine distance. The model is based on RMNet backbone that was developed
-  for fast inference. A single reidentification head from the 1/16 scale feature
-  map outputs the embedding vector of 256 floats. The model is provided without
-  last calibration layer, but can be used in the same way as the original model
-  (with insignificant drop in accuracy).
-task_type: object_attributes
-files:
-  - name: FP32/person-reidentification-retail-0079.xml
-    size: 149868
-    sha256: 8c136d4127830502c1e7dab745908e5982711dd86eb2f0cbe746d4255baef097
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0079/FP32/person-reidentification-retail-0079.xml
-  - name: FP32/person-reidentification-retail-0079.bin
-    size: 3279064
-    sha256: e341d80b568d939dc121d2c4785d1f8bc90df477cd1754d0b286b2e24b7b33e4
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0079/FP32/person-reidentification-retail-0079.bin
-  - name: FP16/person-reidentification-retail-0079.xml
-    size: 149713
-    sha256: 08193544792d4cbd456ae2b7f3850d77346b810b63c622db3e33c08651bc17b6
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0079/FP16/person-reidentification-retail-0079.xml
-  - name: FP16/person-reidentification-retail-0079.bin
-    size: 1639532
-    sha256: 95c426b1d7e8f06f417172f5b1058bd906c769c8c10b3846f8b3adc826390d93
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0079/FP16/person-reidentification-retail-0079.bin
-  - name: INT8/person-reidentification-retail-0079.xml
-    size: 665546
-    sha256: 99c72f383c8eea05387adb64a18027ebfad57c267e07626cc7181df6c74a95e7
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0079/INT8/person-reidentification-retail-0079.xml
-  - name: INT8/person-reidentification-retail-0079.bin
-    size: 3279064
-    sha256: ebbf0d88705e371e0f7f3abea5c889958da1e87c265a605a33d6e155d46f3658
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-reidentification-retail-0079/INT8/person-reidentification-retail-0079.bin
-framework: dldt
-license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-reidentification-retail-0079/person-reidentification-retail-0079.prototxt b/models/intel/person-reidentification-retail-0079/person-reidentification-retail-0079.prototxt
deleted file mode 100644
index c8544d76cf8..00000000000
--- a/models/intel/person-reidentification-retail-0079/person-reidentification-retail-0079.prototxt
+++ /dev/null
@@ -1,8579 +0,0 @@
-name: "ICV-RMNet-PD-ReID-Middle"
-layer {
-type: "Input"
-name: "data"
-top: "data"
-  input_param {
-    shape {
-      dim: 1
-      dim: 3
-      dim: 160
-      dim: 64
-    }
-  }
-}
-
-###################################################
-############### Data normalization ################
-###################################################
-
-layer {
-  name: "data/norm/bn"
-  type: "BatchNorm"
-  bottom: "data"
-  top: "data"
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-}
-layer {
-  name: "data/norm/scale"
-  type: "Scale"
-  bottom: "data"
-  top: "data"
-  param {
-    lr_mult: 1.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 2.0
-    decay_mult: 0.0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1.0
-    }
-    bias_term: true
-    bias_filler {
-      value: 0.0
-    }
-  }
-}
-
-###################################################
-################### Backbone ######################
-###################################################
-
-layer {
-  name: "init_block1/dim_inc/conv"
-  type: "Convolution"
-  bottom: "data"
-  top: "init_block1/dim_inc/conv"
-  param {
-    name: "init_block1/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    stride: 2
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "init_block1/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "init_block1/dim_inc/conv"
-  top: "init_block1/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "init_block1/dim_inc/scale"
-  type: "Scale"
-  bottom: "init_block1/dim_inc/conv"
-  top: "init_block1/dim_inc/conv"
-  param {
-    name: "init_block1/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "init_block1/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "init_block1/dim_inc/fn"
-  type: "ReLU"
-  bottom: "init_block1/dim_inc/conv"
-  top: "init_block1/dim_inc/conv"
-}
-layer {
-  name: "bottleneck1_1/dim_red/conv"
-  type: "Convolution"
-  bottom: "init_block1/dim_inc/conv"
-  top: "bottleneck1_1/dim_red/conv"
-  param {
-    name: "bottleneck1_1/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_1/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_1/dim_red/conv"
-  top: "bottleneck1_1/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_1/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck1_1/dim_red/conv"
-  top: "bottleneck1_1/dim_red/conv"
-  param {
-    name: "bottleneck1_1/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_1/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_1/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck1_1/dim_red/conv"
-  top: "bottleneck1_1/dim_red/conv"
-}
-layer {
-  name: "bottleneck1_1/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_1/dim_red/conv"
-  top: "bottleneck1_1/inner/dw1/conv"
-  param {
-    name: "bottleneck1_1/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 8
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_1/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_1/inner/dw1/conv"
-  top: "bottleneck1_1/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_1/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck1_1/inner/dw1/conv"
-  top: "bottleneck1_1/inner/dw1/conv"
-  param {
-    name: "bottleneck1_1/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_1/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_1/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck1_1/inner/dw1/conv"
-  top: "bottleneck1_1/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck1_1/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_1/inner/dw1/conv"
-  top: "bottleneck1_1/dim_inc/conv"
-  param {
-    name: "bottleneck1_1/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_1/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_1/dim_inc/conv"
-  top: "bottleneck1_1/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_1/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck1_1/dim_inc/conv"
-  top: "bottleneck1_1/dim_inc/conv"
-  param {
-    name: "bottleneck1_1/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_1/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_1/add"
-  type: "Eltwise"
-  bottom: "init_block1/dim_inc/conv"
-  bottom: "bottleneck1_1/dim_inc/conv"
-  top: "bottleneck1_1/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck1_1/fn"
-  type: "ELU"
-  bottom: "bottleneck1_1/add"
-  top: "bottleneck1_1/add"
-}
-layer {
-  name: "bottleneck1_2/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_1/add"
-  top: "bottleneck1_2/dim_red/conv"
-  param {
-    name: "bottleneck1_2/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_2/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_2/dim_red/conv"
-  top: "bottleneck1_2/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_2/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck1_2/dim_red/conv"
-  top: "bottleneck1_2/dim_red/conv"
-  param {
-    name: "bottleneck1_2/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_2/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_2/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck1_2/dim_red/conv"
-  top: "bottleneck1_2/dim_red/conv"
-}
-layer {
-  name: "bottleneck1_2/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_2/dim_red/conv"
-  top: "bottleneck1_2/inner/dw1/conv"
-  param {
-    name: "bottleneck1_2/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 8
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_2/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_2/inner/dw1/conv"
-  top: "bottleneck1_2/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_2/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck1_2/inner/dw1/conv"
-  top: "bottleneck1_2/inner/dw1/conv"
-  param {
-    name: "bottleneck1_2/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_2/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_2/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck1_2/inner/dw1/conv"
-  top: "bottleneck1_2/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck1_2/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_2/inner/dw1/conv"
-  top: "bottleneck1_2/dim_inc/conv"
-  param {
-    name: "bottleneck1_2/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_2/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_2/dim_inc/conv"
-  top: "bottleneck1_2/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_2/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck1_2/dim_inc/conv"
-  top: "bottleneck1_2/dim_inc/conv"
-  param {
-    name: "bottleneck1_2/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_2/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_2/add"
-  type: "Eltwise"
-  bottom: "bottleneck1_1/add"
-  bottom: "bottleneck1_2/dim_inc/conv"
-  top: "bottleneck1_2/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck1_2/fn"
-  type: "ELU"
-  bottom: "bottleneck1_2/add"
-  top: "bottleneck1_2/add"
-}
-layer {
-  name: "bottleneck1_3/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_2/add"
-  top: "bottleneck1_3/dim_red/conv"
-  param {
-    name: "bottleneck1_3/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_3/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_3/dim_red/conv"
-  top: "bottleneck1_3/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_3/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck1_3/dim_red/conv"
-  top: "bottleneck1_3/dim_red/conv"
-  param {
-    name: "bottleneck1_3/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_3/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_3/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck1_3/dim_red/conv"
-  top: "bottleneck1_3/dim_red/conv"
-}
-layer {
-  name: "bottleneck1_3/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_3/dim_red/conv"
-  top: "bottleneck1_3/inner/dw1/conv"
-  param {
-    name: "bottleneck1_3/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 8
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_3/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_3/inner/dw1/conv"
-  top: "bottleneck1_3/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_3/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck1_3/inner/dw1/conv"
-  top: "bottleneck1_3/inner/dw1/conv"
-  param {
-    name: "bottleneck1_3/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_3/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_3/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck1_3/inner/dw1/conv"
-  top: "bottleneck1_3/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck1_3/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_3/inner/dw1/conv"
-  top: "bottleneck1_3/dim_inc/conv"
-  param {
-    name: "bottleneck1_3/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_3/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_3/dim_inc/conv"
-  top: "bottleneck1_3/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_3/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck1_3/dim_inc/conv"
-  top: "bottleneck1_3/dim_inc/conv"
-  param {
-    name: "bottleneck1_3/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_3/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_3/add"
-  type: "Eltwise"
-  bottom: "bottleneck1_2/add"
-  bottom: "bottleneck1_3/dim_inc/conv"
-  top: "bottleneck1_3/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck1_3/fn"
-  type: "ELU"
-  bottom: "bottleneck1_3/add"
-  top: "bottleneck1_3/add"
-}
-layer {
-  name: "bottleneck1_4/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_3/add"
-  top: "bottleneck1_4/dim_red/conv"
-  param {
-    name: "bottleneck1_4/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_4/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_4/dim_red/conv"
-  top: "bottleneck1_4/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_4/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck1_4/dim_red/conv"
-  top: "bottleneck1_4/dim_red/conv"
-  param {
-    name: "bottleneck1_4/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_4/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_4/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck1_4/dim_red/conv"
-  top: "bottleneck1_4/dim_red/conv"
-}
-layer {
-  name: "bottleneck1_4/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_4/dim_red/conv"
-  top: "bottleneck1_4/inner/dw1/conv"
-  param {
-    name: "bottleneck1_4/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 8
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 8
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_4/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_4/inner/dw1/conv"
-  top: "bottleneck1_4/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_4/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck1_4/inner/dw1/conv"
-  top: "bottleneck1_4/inner/dw1/conv"
-  param {
-    name: "bottleneck1_4/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_4/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_4/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck1_4/inner/dw1/conv"
-  top: "bottleneck1_4/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck1_4/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_4/inner/dw1/conv"
-  top: "bottleneck1_4/dim_inc/conv"
-  param {
-    name: "bottleneck1_4/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck1_4/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck1_4/dim_inc/conv"
-  top: "bottleneck1_4/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck1_4/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck1_4/dim_inc/conv"
-  top: "bottleneck1_4/dim_inc/conv"
-  param {
-    name: "bottleneck1_4/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck1_4/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck1_4/add"
-  type: "Eltwise"
-  bottom: "bottleneck1_3/add"
-  bottom: "bottleneck1_4/dim_inc/conv"
-  top: "bottleneck1_4/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck1_4/fn"
-  type: "ELU"
-  bottom: "bottleneck1_4/add"
-  top: "bottleneck1_4/add"
-}
-layer {
-  name: "bottleneck2_0/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck1_4/add"
-  top: "bottleneck2_0/dim_red/conv"
-  param {
-    name: "bottleneck2_0/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_0/dim_red/conv"
-  top: "bottleneck2_0/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_0/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_0/dim_red/conv"
-  top: "bottleneck2_0/dim_red/conv"
-  param {
-    name: "bottleneck2_0/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_0/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_0/dim_red/conv"
-  top: "bottleneck2_0/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_0/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_0/dim_red/conv"
-  top: "bottleneck2_0/inner/dw1/conv"
-  param {
-    name: "bottleneck2_0/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 2
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_0/inner/dw1/conv"
-  top: "bottleneck2_0/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_0/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_0/inner/dw1/conv"
-  top: "bottleneck2_0/inner/dw1/conv"
-  param {
-    name: "bottleneck2_0/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_0/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_0/inner/dw1/conv"
-  top: "bottleneck2_0/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_0/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_0/inner/dw1/conv"
-  top: "bottleneck2_0/dim_inc/conv"
-  param {
-    name: "bottleneck2_0/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_0/dim_inc/conv"
-  top: "bottleneck2_0/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_0/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_0/dim_inc/conv"
-  top: "bottleneck2_0/dim_inc/conv"
-  param {
-    name: "bottleneck2_0/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_0/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/skip/pooling"
-  type: "Pooling"
-  bottom: "bottleneck1_4/add"
-  top: "bottleneck2_0/skip/pooling"
-  pooling_param {
-    pool: MAX
-    kernel_size: 2
-    stride: 2
-    pad: 0
-  }
-}
-layer {
-  name: "bottleneck2_0/skip/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_0/skip/pooling"
-  top: "bottleneck2_0/skip/conv"
-  param {
-    name: "bottleneck2_0/skip/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/skip/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_0/skip/conv"
-  top: "bottleneck2_0/skip/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_0/skip/scale"
-  type: "Scale"
-  bottom: "bottleneck2_0/skip/conv"
-  top: "bottleneck2_0/skip/conv"
-  param {
-    name: "bottleneck2_0/skip/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_0/skip/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_0/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_0/skip/conv"
-  bottom: "bottleneck2_0/dim_inc/conv"
-  top: "bottleneck2_0/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_0/fn"
-  type: "ELU"
-  bottom: "bottleneck2_0/add"
-  top: "bottleneck2_0/add"
-}
-layer {
-  name: "bottleneck2_1/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_0/add"
-  top: "bottleneck2_1/dim_red/conv"
-  param {
-    name: "bottleneck2_1/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_1/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_1/dim_red/conv"
-  top: "bottleneck2_1/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_1/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_1/dim_red/conv"
-  top: "bottleneck2_1/dim_red/conv"
-  param {
-    name: "bottleneck2_1/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_1/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_1/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_1/dim_red/conv"
-  top: "bottleneck2_1/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_1/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_1/dim_red/conv"
-  top: "bottleneck2_1/inner/dw1/conv"
-  param {
-    name: "bottleneck2_1/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_1/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_1/inner/dw1/conv"
-  top: "bottleneck2_1/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_1/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_1/inner/dw1/conv"
-  top: "bottleneck2_1/inner/dw1/conv"
-  param {
-    name: "bottleneck2_1/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_1/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_1/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_1/inner/dw1/conv"
-  top: "bottleneck2_1/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_1/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_1/inner/dw1/conv"
-  top: "bottleneck2_1/dim_inc/conv"
-  param {
-    name: "bottleneck2_1/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_1/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_1/dim_inc/conv"
-  top: "bottleneck2_1/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_1/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_1/dim_inc/conv"
-  top: "bottleneck2_1/dim_inc/conv"
-  param {
-    name: "bottleneck2_1/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_1/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_1/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_0/add"
-  bottom: "bottleneck2_1/dim_inc/conv"
-  top: "bottleneck2_1/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_1/add"
-  top: "bottleneck2_1/add"
-}
-layer {
-  name: "bottleneck2_2/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_1/add"
-  top: "bottleneck2_2/dim_red/conv"
-  param {
-    name: "bottleneck2_2/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_2/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_2/dim_red/conv"
-  top: "bottleneck2_2/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_2/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_2/dim_red/conv"
-  top: "bottleneck2_2/dim_red/conv"
-  param {
-    name: "bottleneck2_2/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_2/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_2/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_2/dim_red/conv"
-  top: "bottleneck2_2/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_2/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_2/dim_red/conv"
-  top: "bottleneck2_2/inner/dw1/conv"
-  param {
-    name: "bottleneck2_2/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_2/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_2/inner/dw1/conv"
-  top: "bottleneck2_2/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_2/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_2/inner/dw1/conv"
-  top: "bottleneck2_2/inner/dw1/conv"
-  param {
-    name: "bottleneck2_2/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_2/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_2/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_2/inner/dw1/conv"
-  top: "bottleneck2_2/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_2/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_2/inner/dw1/conv"
-  top: "bottleneck2_2/dim_inc/conv"
-  param {
-    name: "bottleneck2_2/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_2/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_2/dim_inc/conv"
-  top: "bottleneck2_2/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_2/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_2/dim_inc/conv"
-  top: "bottleneck2_2/dim_inc/conv"
-  param {
-    name: "bottleneck2_2/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_2/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_2/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_1/add"
-  bottom: "bottleneck2_2/dim_inc/conv"
-  top: "bottleneck2_2/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_2/fn"
-  type: "ELU"
-  bottom: "bottleneck2_2/add"
-  top: "bottleneck2_2/add"
-}
-layer {
-  name: "bottleneck2_3/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_2/add"
-  top: "bottleneck2_3/dim_red/conv"
-  param {
-    name: "bottleneck2_3/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_3/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_3/dim_red/conv"
-  top: "bottleneck2_3/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_3/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_3/dim_red/conv"
-  top: "bottleneck2_3/dim_red/conv"
-  param {
-    name: "bottleneck2_3/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_3/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_3/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_3/dim_red/conv"
-  top: "bottleneck2_3/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_3/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_3/dim_red/conv"
-  top: "bottleneck2_3/inner/dw1/conv"
-  param {
-    name: "bottleneck2_3/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_3/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_3/inner/dw1/conv"
-  top: "bottleneck2_3/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_3/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_3/inner/dw1/conv"
-  top: "bottleneck2_3/inner/dw1/conv"
-  param {
-    name: "bottleneck2_3/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_3/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_3/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_3/inner/dw1/conv"
-  top: "bottleneck2_3/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_3/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_3/inner/dw1/conv"
-  top: "bottleneck2_3/dim_inc/conv"
-  param {
-    name: "bottleneck2_3/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_3/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_3/dim_inc/conv"
-  top: "bottleneck2_3/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_3/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_3/dim_inc/conv"
-  top: "bottleneck2_3/dim_inc/conv"
-  param {
-    name: "bottleneck2_3/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_3/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_3/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_2/add"
-  bottom: "bottleneck2_3/dim_inc/conv"
-  top: "bottleneck2_3/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_3/fn"
-  type: "ELU"
-  bottom: "bottleneck2_3/add"
-  top: "bottleneck2_3/add"
-}
-layer {
-  name: "bottleneck2_4/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_3/add"
-  top: "bottleneck2_4/dim_red/conv"
-  param {
-    name: "bottleneck2_4/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_4/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_4/dim_red/conv"
-  top: "bottleneck2_4/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_4/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_4/dim_red/conv"
-  top: "bottleneck2_4/dim_red/conv"
-  param {
-    name: "bottleneck2_4/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_4/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_4/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_4/dim_red/conv"
-  top: "bottleneck2_4/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_4/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_4/dim_red/conv"
-  top: "bottleneck2_4/inner/dw1/conv"
-  param {
-    name: "bottleneck2_4/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_4/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_4/inner/dw1/conv"
-  top: "bottleneck2_4/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_4/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_4/inner/dw1/conv"
-  top: "bottleneck2_4/inner/dw1/conv"
-  param {
-    name: "bottleneck2_4/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_4/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_4/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_4/inner/dw1/conv"
-  top: "bottleneck2_4/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_4/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_4/inner/dw1/conv"
-  top: "bottleneck2_4/dim_inc/conv"
-  param {
-    name: "bottleneck2_4/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_4/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_4/dim_inc/conv"
-  top: "bottleneck2_4/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_4/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_4/dim_inc/conv"
-  top: "bottleneck2_4/dim_inc/conv"
-  param {
-    name: "bottleneck2_4/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_4/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_4/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_3/add"
-  bottom: "bottleneck2_4/dim_inc/conv"
-  top: "bottleneck2_4/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_4/fn"
-  type: "ELU"
-  bottom: "bottleneck2_4/add"
-  top: "bottleneck2_4/add"
-}
-layer {
-  name: "bottleneck2_5/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_4/add"
-  top: "bottleneck2_5/dim_red/conv"
-  param {
-    name: "bottleneck2_5/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_5/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_5/dim_red/conv"
-  top: "bottleneck2_5/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_5/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_5/dim_red/conv"
-  top: "bottleneck2_5/dim_red/conv"
-  param {
-    name: "bottleneck2_5/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_5/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_5/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_5/dim_red/conv"
-  top: "bottleneck2_5/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_5/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_5/dim_red/conv"
-  top: "bottleneck2_5/inner/dw1/conv"
-  param {
-    name: "bottleneck2_5/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_5/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_5/inner/dw1/conv"
-  top: "bottleneck2_5/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_5/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_5/inner/dw1/conv"
-  top: "bottleneck2_5/inner/dw1/conv"
-  param {
-    name: "bottleneck2_5/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_5/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_5/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_5/inner/dw1/conv"
-  top: "bottleneck2_5/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_5/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_5/inner/dw1/conv"
-  top: "bottleneck2_5/dim_inc/conv"
-  param {
-    name: "bottleneck2_5/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_5/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_5/dim_inc/conv"
-  top: "bottleneck2_5/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_5/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_5/dim_inc/conv"
-  top: "bottleneck2_5/dim_inc/conv"
-  param {
-    name: "bottleneck2_5/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_5/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_5/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_4/add"
-  bottom: "bottleneck2_5/dim_inc/conv"
-  top: "bottleneck2_5/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_5/fn"
-  type: "ELU"
-  bottom: "bottleneck2_5/add"
-  top: "bottleneck2_5/add"
-}
-layer {
-  name: "bottleneck2_6/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_5/add"
-  top: "bottleneck2_6/dim_red/conv"
-  param {
-    name: "bottleneck2_6/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_6/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_6/dim_red/conv"
-  top: "bottleneck2_6/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_6/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_6/dim_red/conv"
-  top: "bottleneck2_6/dim_red/conv"
-  param {
-    name: "bottleneck2_6/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_6/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_6/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_6/dim_red/conv"
-  top: "bottleneck2_6/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_6/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_6/dim_red/conv"
-  top: "bottleneck2_6/inner/dw1/conv"
-  param {
-    name: "bottleneck2_6/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_6/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_6/inner/dw1/conv"
-  top: "bottleneck2_6/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_6/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_6/inner/dw1/conv"
-  top: "bottleneck2_6/inner/dw1/conv"
-  param {
-    name: "bottleneck2_6/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_6/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_6/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_6/inner/dw1/conv"
-  top: "bottleneck2_6/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_6/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_6/inner/dw1/conv"
-  top: "bottleneck2_6/dim_inc/conv"
-  param {
-    name: "bottleneck2_6/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_6/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_6/dim_inc/conv"
-  top: "bottleneck2_6/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_6/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_6/dim_inc/conv"
-  top: "bottleneck2_6/dim_inc/conv"
-  param {
-    name: "bottleneck2_6/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_6/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_6/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_5/add"
-  bottom: "bottleneck2_6/dim_inc/conv"
-  top: "bottleneck2_6/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_6/fn"
-  type: "ELU"
-  bottom: "bottleneck2_6/add"
-  top: "bottleneck2_6/add"
-}
-layer {
-  name: "bottleneck2_7/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_6/add"
-  top: "bottleneck2_7/dim_red/conv"
-  param {
-    name: "bottleneck2_7/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_7/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_7/dim_red/conv"
-  top: "bottleneck2_7/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_7/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_7/dim_red/conv"
-  top: "bottleneck2_7/dim_red/conv"
-  param {
-    name: "bottleneck2_7/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_7/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_7/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_7/dim_red/conv"
-  top: "bottleneck2_7/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_7/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_7/dim_red/conv"
-  top: "bottleneck2_7/inner/dw1/conv"
-  param {
-    name: "bottleneck2_7/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_7/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_7/inner/dw1/conv"
-  top: "bottleneck2_7/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_7/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_7/inner/dw1/conv"
-  top: "bottleneck2_7/inner/dw1/conv"
-  param {
-    name: "bottleneck2_7/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_7/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_7/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_7/inner/dw1/conv"
-  top: "bottleneck2_7/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_7/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_7/inner/dw1/conv"
-  top: "bottleneck2_7/dim_inc/conv"
-  param {
-    name: "bottleneck2_7/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_7/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_7/dim_inc/conv"
-  top: "bottleneck2_7/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_7/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_7/dim_inc/conv"
-  top: "bottleneck2_7/dim_inc/conv"
-  param {
-    name: "bottleneck2_7/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_7/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_7/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_6/add"
-  bottom: "bottleneck2_7/dim_inc/conv"
-  top: "bottleneck2_7/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_7/fn"
-  type: "ELU"
-  bottom: "bottleneck2_7/add"
-  top: "bottleneck2_7/add"
-}
-layer {
-  name: "bottleneck2_8/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_7/add"
-  top: "bottleneck2_8/dim_red/conv"
-  param {
-    name: "bottleneck2_8/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_8/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_8/dim_red/conv"
-  top: "bottleneck2_8/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_8/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck2_8/dim_red/conv"
-  top: "bottleneck2_8/dim_red/conv"
-  param {
-    name: "bottleneck2_8/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_8/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_8/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck2_8/dim_red/conv"
-  top: "bottleneck2_8/dim_red/conv"
-}
-layer {
-  name: "bottleneck2_8/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_8/dim_red/conv"
-  top: "bottleneck2_8/inner/dw1/conv"
-  param {
-    name: "bottleneck2_8/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 16
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 16
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_8/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_8/inner/dw1/conv"
-  top: "bottleneck2_8/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_8/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck2_8/inner/dw1/conv"
-  top: "bottleneck2_8/inner/dw1/conv"
-  param {
-    name: "bottleneck2_8/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_8/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_8/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck2_8/inner/dw1/conv"
-  top: "bottleneck2_8/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck2_8/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_8/inner/dw1/conv"
-  top: "bottleneck2_8/dim_inc/conv"
-  param {
-    name: "bottleneck2_8/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck2_8/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck2_8/dim_inc/conv"
-  top: "bottleneck2_8/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck2_8/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck2_8/dim_inc/conv"
-  top: "bottleneck2_8/dim_inc/conv"
-  param {
-    name: "bottleneck2_8/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck2_8/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck2_8/add"
-  type: "Eltwise"
-  bottom: "bottleneck2_7/add"
-  bottom: "bottleneck2_8/dim_inc/conv"
-  top: "bottleneck2_8/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck2_8/fn"
-  type: "ELU"
-  bottom: "bottleneck2_8/add"
-  top: "bottleneck2_8/add"
-}
-layer {
-  name: "bottleneck3_0/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck2_8/add"
-  top: "bottleneck3_0/dim_red/conv"
-  param {
-    name: "bottleneck3_0/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_0/dim_red/conv"
-  top: "bottleneck3_0/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_0/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_0/dim_red/conv"
-  top: "bottleneck3_0/dim_red/conv"
-  param {
-    name: "bottleneck3_0/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_0/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_0/dim_red/conv"
-  top: "bottleneck3_0/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_0/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_0/dim_red/conv"
-  top: "bottleneck3_0/inner/dw1/conv"
-  param {
-    name: "bottleneck3_0/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 2
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_0/inner/dw1/conv"
-  top: "bottleneck3_0/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_0/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_0/inner/dw1/conv"
-  top: "bottleneck3_0/inner/dw1/conv"
-  param {
-    name: "bottleneck3_0/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_0/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_0/inner/dw1/conv"
-  top: "bottleneck3_0/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_0/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_0/inner/dw1/conv"
-  top: "bottleneck3_0/dim_inc/conv"
-  param {
-    name: "bottleneck3_0/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_0/dim_inc/conv"
-  top: "bottleneck3_0/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_0/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_0/dim_inc/conv"
-  top: "bottleneck3_0/dim_inc/conv"
-  param {
-    name: "bottleneck3_0/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_0/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/skip/pooling"
-  type: "Pooling"
-  bottom: "bottleneck2_8/add"
-  top: "bottleneck3_0/skip/pooling"
-  pooling_param {
-    pool: MAX
-    kernel_size: 2
-    stride: 2
-    pad: 0
-  }
-}
-layer {
-  name: "bottleneck3_0/skip/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_0/skip/pooling"
-  top: "bottleneck3_0/skip/conv"
-  param {
-    name: "bottleneck3_0/skip/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/skip/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_0/skip/conv"
-  top: "bottleneck3_0/skip/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_0/skip/scale"
-  type: "Scale"
-  bottom: "bottleneck3_0/skip/conv"
-  top: "bottleneck3_0/skip/conv"
-  param {
-    name: "bottleneck3_0/skip/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_0/skip/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_0/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_0/skip/conv"
-  bottom: "bottleneck3_0/dim_inc/conv"
-  top: "bottleneck3_0/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_0/fn"
-  type: "ELU"
-  bottom: "bottleneck3_0/add"
-  top: "bottleneck3_0/add"
-}
-layer {
-  name: "bottleneck3_1/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_0/add"
-  top: "bottleneck3_1/dim_red/conv"
-  param {
-    name: "bottleneck3_1/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_1/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_1/dim_red/conv"
-  top: "bottleneck3_1/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_1/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_1/dim_red/conv"
-  top: "bottleneck3_1/dim_red/conv"
-  param {
-    name: "bottleneck3_1/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_1/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_1/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_1/dim_red/conv"
-  top: "bottleneck3_1/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_1/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_1/dim_red/conv"
-  top: "bottleneck3_1/inner/dw1/conv"
-  param {
-    name: "bottleneck3_1/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_1/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_1/inner/dw1/conv"
-  top: "bottleneck3_1/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_1/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_1/inner/dw1/conv"
-  top: "bottleneck3_1/inner/dw1/conv"
-  param {
-    name: "bottleneck3_1/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_1/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_1/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_1/inner/dw1/conv"
-  top: "bottleneck3_1/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_1/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_1/inner/dw1/conv"
-  top: "bottleneck3_1/dim_inc/conv"
-  param {
-    name: "bottleneck3_1/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_1/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_1/dim_inc/conv"
-  top: "bottleneck3_1/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_1/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_1/dim_inc/conv"
-  top: "bottleneck3_1/dim_inc/conv"
-  param {
-    name: "bottleneck3_1/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_1/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_1/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_0/add"
-  bottom: "bottleneck3_1/dim_inc/conv"
-  top: "bottleneck3_1/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_1/add"
-  top: "bottleneck3_1/add"
-}
-layer {
-  name: "bottleneck3_2/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_1/add"
-  top: "bottleneck3_2/dim_red/conv"
-  param {
-    name: "bottleneck3_2/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_2/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_2/dim_red/conv"
-  top: "bottleneck3_2/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_2/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_2/dim_red/conv"
-  top: "bottleneck3_2/dim_red/conv"
-  param {
-    name: "bottleneck3_2/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_2/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_2/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_2/dim_red/conv"
-  top: "bottleneck3_2/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_2/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_2/dim_red/conv"
-  top: "bottleneck3_2/inner/dw1/conv"
-  param {
-    name: "bottleneck3_2/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_2/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_2/inner/dw1/conv"
-  top: "bottleneck3_2/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_2/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_2/inner/dw1/conv"
-  top: "bottleneck3_2/inner/dw1/conv"
-  param {
-    name: "bottleneck3_2/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_2/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_2/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_2/inner/dw1/conv"
-  top: "bottleneck3_2/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_2/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_2/inner/dw1/conv"
-  top: "bottleneck3_2/dim_inc/conv"
-  param {
-    name: "bottleneck3_2/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_2/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_2/dim_inc/conv"
-  top: "bottleneck3_2/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_2/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_2/dim_inc/conv"
-  top: "bottleneck3_2/dim_inc/conv"
-  param {
-    name: "bottleneck3_2/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_2/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_2/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_1/add"
-  bottom: "bottleneck3_2/dim_inc/conv"
-  top: "bottleneck3_2/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_2/fn"
-  type: "ELU"
-  bottom: "bottleneck3_2/add"
-  top: "bottleneck3_2/add"
-}
-layer {
-  name: "bottleneck3_3/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_2/add"
-  top: "bottleneck3_3/dim_red/conv"
-  param {
-    name: "bottleneck3_3/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_3/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_3/dim_red/conv"
-  top: "bottleneck3_3/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_3/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_3/dim_red/conv"
-  top: "bottleneck3_3/dim_red/conv"
-  param {
-    name: "bottleneck3_3/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_3/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_3/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_3/dim_red/conv"
-  top: "bottleneck3_3/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_3/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_3/dim_red/conv"
-  top: "bottleneck3_3/inner/dw1/conv"
-  param {
-    name: "bottleneck3_3/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_3/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_3/inner/dw1/conv"
-  top: "bottleneck3_3/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_3/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_3/inner/dw1/conv"
-  top: "bottleneck3_3/inner/dw1/conv"
-  param {
-    name: "bottleneck3_3/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_3/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_3/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_3/inner/dw1/conv"
-  top: "bottleneck3_3/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_3/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_3/inner/dw1/conv"
-  top: "bottleneck3_3/dim_inc/conv"
-  param {
-    name: "bottleneck3_3/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_3/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_3/dim_inc/conv"
-  top: "bottleneck3_3/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_3/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_3/dim_inc/conv"
-  top: "bottleneck3_3/dim_inc/conv"
-  param {
-    name: "bottleneck3_3/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_3/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_3/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_2/add"
-  bottom: "bottleneck3_3/dim_inc/conv"
-  top: "bottleneck3_3/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_3/fn"
-  type: "ELU"
-  bottom: "bottleneck3_3/add"
-  top: "bottleneck3_3/add"
-}
-layer {
-  name: "bottleneck3_4/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_3/add"
-  top: "bottleneck3_4/dim_red/conv"
-  param {
-    name: "bottleneck3_4/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_4/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_4/dim_red/conv"
-  top: "bottleneck3_4/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_4/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_4/dim_red/conv"
-  top: "bottleneck3_4/dim_red/conv"
-  param {
-    name: "bottleneck3_4/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_4/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_4/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_4/dim_red/conv"
-  top: "bottleneck3_4/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_4/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_4/dim_red/conv"
-  top: "bottleneck3_4/inner/dw1/conv"
-  param {
-    name: "bottleneck3_4/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_4/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_4/inner/dw1/conv"
-  top: "bottleneck3_4/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_4/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_4/inner/dw1/conv"
-  top: "bottleneck3_4/inner/dw1/conv"
-  param {
-    name: "bottleneck3_4/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_4/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_4/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_4/inner/dw1/conv"
-  top: "bottleneck3_4/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_4/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_4/inner/dw1/conv"
-  top: "bottleneck3_4/dim_inc/conv"
-  param {
-    name: "bottleneck3_4/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_4/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_4/dim_inc/conv"
-  top: "bottleneck3_4/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_4/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_4/dim_inc/conv"
-  top: "bottleneck3_4/dim_inc/conv"
-  param {
-    name: "bottleneck3_4/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_4/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_4/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_3/add"
-  bottom: "bottleneck3_4/dim_inc/conv"
-  top: "bottleneck3_4/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_4/fn"
-  type: "ELU"
-  bottom: "bottleneck3_4/add"
-  top: "bottleneck3_4/add"
-}
-layer {
-  name: "bottleneck3_5/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_4/add"
-  top: "bottleneck3_5/dim_red/conv"
-  param {
-    name: "bottleneck3_5/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_5/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_5/dim_red/conv"
-  top: "bottleneck3_5/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_5/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_5/dim_red/conv"
-  top: "bottleneck3_5/dim_red/conv"
-  param {
-    name: "bottleneck3_5/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_5/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_5/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_5/dim_red/conv"
-  top: "bottleneck3_5/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_5/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_5/dim_red/conv"
-  top: "bottleneck3_5/inner/dw1/conv"
-  param {
-    name: "bottleneck3_5/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_5/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_5/inner/dw1/conv"
-  top: "bottleneck3_5/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_5/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_5/inner/dw1/conv"
-  top: "bottleneck3_5/inner/dw1/conv"
-  param {
-    name: "bottleneck3_5/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_5/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_5/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_5/inner/dw1/conv"
-  top: "bottleneck3_5/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_5/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_5/inner/dw1/conv"
-  top: "bottleneck3_5/dim_inc/conv"
-  param {
-    name: "bottleneck3_5/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_5/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_5/dim_inc/conv"
-  top: "bottleneck3_5/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_5/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_5/dim_inc/conv"
-  top: "bottleneck3_5/dim_inc/conv"
-  param {
-    name: "bottleneck3_5/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_5/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_5/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_4/add"
-  bottom: "bottleneck3_5/dim_inc/conv"
-  top: "bottleneck3_5/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_5/fn"
-  type: "ELU"
-  bottom: "bottleneck3_5/add"
-  top: "bottleneck3_5/add"
-}
-layer {
-  name: "bottleneck3_6/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_5/add"
-  top: "bottleneck3_6/dim_red/conv"
-  param {
-    name: "bottleneck3_6/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_6/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_6/dim_red/conv"
-  top: "bottleneck3_6/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_6/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_6/dim_red/conv"
-  top: "bottleneck3_6/dim_red/conv"
-  param {
-    name: "bottleneck3_6/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_6/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_6/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_6/dim_red/conv"
-  top: "bottleneck3_6/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_6/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_6/dim_red/conv"
-  top: "bottleneck3_6/inner/dw1/conv"
-  param {
-    name: "bottleneck3_6/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_6/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_6/inner/dw1/conv"
-  top: "bottleneck3_6/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_6/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_6/inner/dw1/conv"
-  top: "bottleneck3_6/inner/dw1/conv"
-  param {
-    name: "bottleneck3_6/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_6/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_6/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_6/inner/dw1/conv"
-  top: "bottleneck3_6/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_6/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_6/inner/dw1/conv"
-  top: "bottleneck3_6/dim_inc/conv"
-  param {
-    name: "bottleneck3_6/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_6/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_6/dim_inc/conv"
-  top: "bottleneck3_6/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_6/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_6/dim_inc/conv"
-  top: "bottleneck3_6/dim_inc/conv"
-  param {
-    name: "bottleneck3_6/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_6/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_6/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_5/add"
-  bottom: "bottleneck3_6/dim_inc/conv"
-  top: "bottleneck3_6/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_6/fn"
-  type: "ELU"
-  bottom: "bottleneck3_6/add"
-  top: "bottleneck3_6/add"
-}
-layer {
-  name: "bottleneck3_7/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_6/add"
-  top: "bottleneck3_7/dim_red/conv"
-  param {
-    name: "bottleneck3_7/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_7/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_7/dim_red/conv"
-  top: "bottleneck3_7/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_7/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_7/dim_red/conv"
-  top: "bottleneck3_7/dim_red/conv"
-  param {
-    name: "bottleneck3_7/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_7/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_7/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_7/dim_red/conv"
-  top: "bottleneck3_7/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_7/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_7/dim_red/conv"
-  top: "bottleneck3_7/inner/dw1/conv"
-  param {
-    name: "bottleneck3_7/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_7/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_7/inner/dw1/conv"
-  top: "bottleneck3_7/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_7/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_7/inner/dw1/conv"
-  top: "bottleneck3_7/inner/dw1/conv"
-  param {
-    name: "bottleneck3_7/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_7/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_7/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_7/inner/dw1/conv"
-  top: "bottleneck3_7/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_7/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_7/inner/dw1/conv"
-  top: "bottleneck3_7/dim_inc/conv"
-  param {
-    name: "bottleneck3_7/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_7/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_7/dim_inc/conv"
-  top: "bottleneck3_7/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_7/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_7/dim_inc/conv"
-  top: "bottleneck3_7/dim_inc/conv"
-  param {
-    name: "bottleneck3_7/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_7/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_7/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_6/add"
-  bottom: "bottleneck3_7/dim_inc/conv"
-  top: "bottleneck3_7/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_7/fn"
-  type: "ELU"
-  bottom: "bottleneck3_7/add"
-  top: "bottleneck3_7/add"
-}
-layer {
-  name: "bottleneck3_8/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_7/add"
-  top: "bottleneck3_8/dim_red/conv"
-  param {
-    name: "bottleneck3_8/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_8/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_8/dim_red/conv"
-  top: "bottleneck3_8/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_8/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_8/dim_red/conv"
-  top: "bottleneck3_8/dim_red/conv"
-  param {
-    name: "bottleneck3_8/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_8/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_8/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_8/dim_red/conv"
-  top: "bottleneck3_8/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_8/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_8/dim_red/conv"
-  top: "bottleneck3_8/inner/dw1/conv"
-  param {
-    name: "bottleneck3_8/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_8/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_8/inner/dw1/conv"
-  top: "bottleneck3_8/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_8/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_8/inner/dw1/conv"
-  top: "bottleneck3_8/inner/dw1/conv"
-  param {
-    name: "bottleneck3_8/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_8/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_8/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_8/inner/dw1/conv"
-  top: "bottleneck3_8/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_8/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_8/inner/dw1/conv"
-  top: "bottleneck3_8/dim_inc/conv"
-  param {
-    name: "bottleneck3_8/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_8/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_8/dim_inc/conv"
-  top: "bottleneck3_8/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_8/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_8/dim_inc/conv"
-  top: "bottleneck3_8/dim_inc/conv"
-  param {
-    name: "bottleneck3_8/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_8/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_8/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_7/add"
-  bottom: "bottleneck3_8/dim_inc/conv"
-  top: "bottleneck3_8/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_8/fn"
-  type: "ELU"
-  bottom: "bottleneck3_8/add"
-  top: "bottleneck3_8/add"
-}
-layer {
-  name: "bottleneck3_9/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_8/add"
-  top: "bottleneck3_9/dim_red/conv"
-  param {
-    name: "bottleneck3_9/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_9/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_9/dim_red/conv"
-  top: "bottleneck3_9/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_9/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_9/dim_red/conv"
-  top: "bottleneck3_9/dim_red/conv"
-  param {
-    name: "bottleneck3_9/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_9/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_9/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_9/dim_red/conv"
-  top: "bottleneck3_9/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_9/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_9/dim_red/conv"
-  top: "bottleneck3_9/inner/dw1/conv"
-  param {
-    name: "bottleneck3_9/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_9/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_9/inner/dw1/conv"
-  top: "bottleneck3_9/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_9/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_9/inner/dw1/conv"
-  top: "bottleneck3_9/inner/dw1/conv"
-  param {
-    name: "bottleneck3_9/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_9/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_9/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_9/inner/dw1/conv"
-  top: "bottleneck3_9/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_9/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_9/inner/dw1/conv"
-  top: "bottleneck3_9/dim_inc/conv"
-  param {
-    name: "bottleneck3_9/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_9/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_9/dim_inc/conv"
-  top: "bottleneck3_9/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_9/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_9/dim_inc/conv"
-  top: "bottleneck3_9/dim_inc/conv"
-  param {
-    name: "bottleneck3_9/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_9/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_9/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_8/add"
-  bottom: "bottleneck3_9/dim_inc/conv"
-  top: "bottleneck3_9/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_9/fn"
-  type: "ELU"
-  bottom: "bottleneck3_9/add"
-  top: "bottleneck3_9/add"
-}
-layer {
-  name: "bottleneck3_10/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_9/add"
-  top: "bottleneck3_10/dim_red/conv"
-  param {
-    name: "bottleneck3_10/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_10/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_10/dim_red/conv"
-  top: "bottleneck3_10/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_10/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck3_10/dim_red/conv"
-  top: "bottleneck3_10/dim_red/conv"
-  param {
-    name: "bottleneck3_10/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_10/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_10/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck3_10/dim_red/conv"
-  top: "bottleneck3_10/dim_red/conv"
-}
-layer {
-  name: "bottleneck3_10/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_10/dim_red/conv"
-  top: "bottleneck3_10/inner/dw1/conv"
-  param {
-    name: "bottleneck3_10/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 32
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 32
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_10/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_10/inner/dw1/conv"
-  top: "bottleneck3_10/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_10/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck3_10/inner/dw1/conv"
-  top: "bottleneck3_10/inner/dw1/conv"
-  param {
-    name: "bottleneck3_10/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_10/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_10/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck3_10/inner/dw1/conv"
-  top: "bottleneck3_10/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck3_10/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_10/inner/dw1/conv"
-  top: "bottleneck3_10/dim_inc/conv"
-  param {
-    name: "bottleneck3_10/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 128
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck3_10/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck3_10/dim_inc/conv"
-  top: "bottleneck3_10/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck3_10/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck3_10/dim_inc/conv"
-  top: "bottleneck3_10/dim_inc/conv"
-  param {
-    name: "bottleneck3_10/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck3_10/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck3_10/add"
-  type: "Eltwise"
-  bottom: "bottleneck3_9/add"
-  bottom: "bottleneck3_10/dim_inc/conv"
-  top: "bottleneck3_10/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck3_10/fn"
-  type: "ELU"
-  bottom: "bottleneck3_10/add"
-  top: "bottleneck3_10/add"
-}
-layer {
-  name: "bottleneck4_0/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck3_10/add"
-  top: "bottleneck4_0/dim_red/conv"
-  param {
-    name: "bottleneck4_0/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_0/dim_red/conv"
-  top: "bottleneck4_0/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_0/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_0/dim_red/conv"
-  top: "bottleneck4_0/dim_red/conv"
-  param {
-    name: "bottleneck4_0/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_0/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_0/dim_red/conv"
-  top: "bottleneck4_0/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_0/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_0/dim_red/conv"
-  top: "bottleneck4_0/inner/dw1/conv"
-  param {
-    name: "bottleneck4_0/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 2
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_0/inner/dw1/conv"
-  top: "bottleneck4_0/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_0/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_0/inner/dw1/conv"
-  top: "bottleneck4_0/inner/dw1/conv"
-  param {
-    name: "bottleneck4_0/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_0/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_0/inner/dw1/conv"
-  top: "bottleneck4_0/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_0/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_0/inner/dw1/conv"
-  top: "bottleneck4_0/dim_inc/conv"
-  param {
-    name: "bottleneck4_0/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_0/dim_inc/conv"
-  top: "bottleneck4_0/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_0/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_0/dim_inc/conv"
-  top: "bottleneck4_0/dim_inc/conv"
-  param {
-    name: "bottleneck4_0/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_0/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/skip/pooling"
-  type: "Pooling"
-  bottom: "bottleneck3_10/add"
-  top: "bottleneck4_0/skip/pooling"
-  pooling_param {
-    pool: MAX
-    kernel_size: 2
-    stride: 2
-    pad: 0
-  }
-}
-layer {
-  name: "bottleneck4_0/skip/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_0/skip/pooling"
-  top: "bottleneck4_0/skip/conv"
-  param {
-    name: "bottleneck4_0/skip/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/skip/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_0/skip/conv"
-  top: "bottleneck4_0/skip/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_0/skip/scale"
-  type: "Scale"
-  bottom: "bottleneck4_0/skip/conv"
-  top: "bottleneck4_0/skip/conv"
-  param {
-    name: "bottleneck4_0/skip/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_0/skip/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_0/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_0/skip/conv"
-  bottom: "bottleneck4_0/dim_inc/conv"
-  top: "bottleneck4_0/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_0/fn"
-  type: "ELU"
-  bottom: "bottleneck4_0/add"
-  top: "bottleneck4_0/add"
-}
-layer {
-  name: "bottleneck4_1/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_0/add"
-  top: "bottleneck4_1/dim_red/conv"
-  param {
-    name: "bottleneck4_1/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_1/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_1/dim_red/conv"
-  top: "bottleneck4_1/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_1/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_1/dim_red/conv"
-  top: "bottleneck4_1/dim_red/conv"
-  param {
-    name: "bottleneck4_1/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_1/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_1/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_1/dim_red/conv"
-  top: "bottleneck4_1/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_1/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_1/dim_red/conv"
-  top: "bottleneck4_1/inner/dw1/conv"
-  param {
-    name: "bottleneck4_1/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_1/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_1/inner/dw1/conv"
-  top: "bottleneck4_1/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_1/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_1/inner/dw1/conv"
-  top: "bottleneck4_1/inner/dw1/conv"
-  param {
-    name: "bottleneck4_1/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_1/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_1/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_1/inner/dw1/conv"
-  top: "bottleneck4_1/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_1/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_1/inner/dw1/conv"
-  top: "bottleneck4_1/dim_inc/conv"
-  param {
-    name: "bottleneck4_1/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_1/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_1/dim_inc/conv"
-  top: "bottleneck4_1/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_1/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_1/dim_inc/conv"
-  top: "bottleneck4_1/dim_inc/conv"
-  param {
-    name: "bottleneck4_1/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_1/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_1/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_0/add"
-  bottom: "bottleneck4_1/dim_inc/conv"
-  top: "bottleneck4_1/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_1/add"
-  top: "bottleneck4_1/add"
-}
-layer {
-  name: "bottleneck4_2/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_1/add"
-  top: "bottleneck4_2/dim_red/conv"
-  param {
-    name: "bottleneck4_2/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_2/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_2/dim_red/conv"
-  top: "bottleneck4_2/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_2/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_2/dim_red/conv"
-  top: "bottleneck4_2/dim_red/conv"
-  param {
-    name: "bottleneck4_2/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_2/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_2/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_2/dim_red/conv"
-  top: "bottleneck4_2/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_2/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_2/dim_red/conv"
-  top: "bottleneck4_2/inner/dw1/conv"
-  param {
-    name: "bottleneck4_2/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_2/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_2/inner/dw1/conv"
-  top: "bottleneck4_2/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_2/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_2/inner/dw1/conv"
-  top: "bottleneck4_2/inner/dw1/conv"
-  param {
-    name: "bottleneck4_2/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_2/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_2/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_2/inner/dw1/conv"
-  top: "bottleneck4_2/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_2/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_2/inner/dw1/conv"
-  top: "bottleneck4_2/dim_inc/conv"
-  param {
-    name: "bottleneck4_2/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_2/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_2/dim_inc/conv"
-  top: "bottleneck4_2/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_2/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_2/dim_inc/conv"
-  top: "bottleneck4_2/dim_inc/conv"
-  param {
-    name: "bottleneck4_2/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_2/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_2/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_1/add"
-  bottom: "bottleneck4_2/dim_inc/conv"
-  top: "bottleneck4_2/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_2/fn"
-  type: "ELU"
-  bottom: "bottleneck4_2/add"
-  top: "bottleneck4_2/add"
-}
-layer {
-  name: "bottleneck4_3/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_2/add"
-  top: "bottleneck4_3/dim_red/conv"
-  param {
-    name: "bottleneck4_3/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_3/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_3/dim_red/conv"
-  top: "bottleneck4_3/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_3/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_3/dim_red/conv"
-  top: "bottleneck4_3/dim_red/conv"
-  param {
-    name: "bottleneck4_3/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_3/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_3/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_3/dim_red/conv"
-  top: "bottleneck4_3/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_3/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_3/dim_red/conv"
-  top: "bottleneck4_3/inner/dw1/conv"
-  param {
-    name: "bottleneck4_3/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_3/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_3/inner/dw1/conv"
-  top: "bottleneck4_3/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_3/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_3/inner/dw1/conv"
-  top: "bottleneck4_3/inner/dw1/conv"
-  param {
-    name: "bottleneck4_3/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_3/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_3/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_3/inner/dw1/conv"
-  top: "bottleneck4_3/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_3/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_3/inner/dw1/conv"
-  top: "bottleneck4_3/dim_inc/conv"
-  param {
-    name: "bottleneck4_3/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_3/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_3/dim_inc/conv"
-  top: "bottleneck4_3/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_3/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_3/dim_inc/conv"
-  top: "bottleneck4_3/dim_inc/conv"
-  param {
-    name: "bottleneck4_3/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_3/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_3/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_2/add"
-  bottom: "bottleneck4_3/dim_inc/conv"
-  top: "bottleneck4_3/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_3/fn"
-  type: "ELU"
-  bottom: "bottleneck4_3/add"
-  top: "bottleneck4_3/add"
-}
-layer {
-  name: "bottleneck4_4/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_3/add"
-  top: "bottleneck4_4/dim_red/conv"
-  param {
-    name: "bottleneck4_4/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_4/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_4/dim_red/conv"
-  top: "bottleneck4_4/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_4/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_4/dim_red/conv"
-  top: "bottleneck4_4/dim_red/conv"
-  param {
-    name: "bottleneck4_4/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_4/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_4/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_4/dim_red/conv"
-  top: "bottleneck4_4/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_4/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_4/dim_red/conv"
-  top: "bottleneck4_4/inner/dw1/conv"
-  param {
-    name: "bottleneck4_4/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_4/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_4/inner/dw1/conv"
-  top: "bottleneck4_4/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_4/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_4/inner/dw1/conv"
-  top: "bottleneck4_4/inner/dw1/conv"
-  param {
-    name: "bottleneck4_4/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_4/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_4/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_4/inner/dw1/conv"
-  top: "bottleneck4_4/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_4/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_4/inner/dw1/conv"
-  top: "bottleneck4_4/dim_inc/conv"
-  param {
-    name: "bottleneck4_4/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_4/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_4/dim_inc/conv"
-  top: "bottleneck4_4/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_4/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_4/dim_inc/conv"
-  top: "bottleneck4_4/dim_inc/conv"
-  param {
-    name: "bottleneck4_4/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_4/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_4/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_3/add"
-  bottom: "bottleneck4_4/dim_inc/conv"
-  top: "bottleneck4_4/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_4/fn"
-  type: "ELU"
-  bottom: "bottleneck4_4/add"
-  top: "bottleneck4_4/add"
-}
-layer {
-  name: "bottleneck4_5/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_4/add"
-  top: "bottleneck4_5/dim_red/conv"
-  param {
-    name: "bottleneck4_5/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_5/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_5/dim_red/conv"
-  top: "bottleneck4_5/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_5/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_5/dim_red/conv"
-  top: "bottleneck4_5/dim_red/conv"
-  param {
-    name: "bottleneck4_5/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_5/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_5/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_5/dim_red/conv"
-  top: "bottleneck4_5/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_5/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_5/dim_red/conv"
-  top: "bottleneck4_5/inner/dw1/conv"
-  param {
-    name: "bottleneck4_5/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_5/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_5/inner/dw1/conv"
-  top: "bottleneck4_5/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_5/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_5/inner/dw1/conv"
-  top: "bottleneck4_5/inner/dw1/conv"
-  param {
-    name: "bottleneck4_5/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_5/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_5/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_5/inner/dw1/conv"
-  top: "bottleneck4_5/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_5/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_5/inner/dw1/conv"
-  top: "bottleneck4_5/dim_inc/conv"
-  param {
-    name: "bottleneck4_5/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_5/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_5/dim_inc/conv"
-  top: "bottleneck4_5/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_5/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_5/dim_inc/conv"
-  top: "bottleneck4_5/dim_inc/conv"
-  param {
-    name: "bottleneck4_5/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_5/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_5/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_4/add"
-  bottom: "bottleneck4_5/dim_inc/conv"
-  top: "bottleneck4_5/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_5/fn"
-  type: "ELU"
-  bottom: "bottleneck4_5/add"
-  top: "bottleneck4_5/add"
-}
-layer {
-  name: "bottleneck4_6/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_5/add"
-  top: "bottleneck4_6/dim_red/conv"
-  param {
-    name: "bottleneck4_6/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_6/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_6/dim_red/conv"
-  top: "bottleneck4_6/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_6/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_6/dim_red/conv"
-  top: "bottleneck4_6/dim_red/conv"
-  param {
-    name: "bottleneck4_6/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_6/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_6/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_6/dim_red/conv"
-  top: "bottleneck4_6/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_6/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_6/dim_red/conv"
-  top: "bottleneck4_6/inner/dw1/conv"
-  param {
-    name: "bottleneck4_6/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_6/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_6/inner/dw1/conv"
-  top: "bottleneck4_6/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_6/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_6/inner/dw1/conv"
-  top: "bottleneck4_6/inner/dw1/conv"
-  param {
-    name: "bottleneck4_6/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_6/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_6/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_6/inner/dw1/conv"
-  top: "bottleneck4_6/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_6/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_6/inner/dw1/conv"
-  top: "bottleneck4_6/dim_inc/conv"
-  param {
-    name: "bottleneck4_6/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_6/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_6/dim_inc/conv"
-  top: "bottleneck4_6/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_6/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_6/dim_inc/conv"
-  top: "bottleneck4_6/dim_inc/conv"
-  param {
-    name: "bottleneck4_6/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_6/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_6/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_5/add"
-  bottom: "bottleneck4_6/dim_inc/conv"
-  top: "bottleneck4_6/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_6/fn"
-  type: "ELU"
-  bottom: "bottleneck4_6/add"
-  top: "bottleneck4_6/add"
-}
-layer {
-  name: "bottleneck4_7/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_6/add"
-  top: "bottleneck4_7/dim_red/conv"
-  param {
-    name: "bottleneck4_7/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_7/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_7/dim_red/conv"
-  top: "bottleneck4_7/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_7/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_7/dim_red/conv"
-  top: "bottleneck4_7/dim_red/conv"
-  param {
-    name: "bottleneck4_7/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_7/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_7/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_7/dim_red/conv"
-  top: "bottleneck4_7/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_7/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_7/dim_red/conv"
-  top: "bottleneck4_7/inner/dw1/conv"
-  param {
-    name: "bottleneck4_7/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_7/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_7/inner/dw1/conv"
-  top: "bottleneck4_7/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_7/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_7/inner/dw1/conv"
-  top: "bottleneck4_7/inner/dw1/conv"
-  param {
-    name: "bottleneck4_7/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_7/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_7/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_7/inner/dw1/conv"
-  top: "bottleneck4_7/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_7/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_7/inner/dw1/conv"
-  top: "bottleneck4_7/dim_inc/conv"
-  param {
-    name: "bottleneck4_7/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_7/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_7/dim_inc/conv"
-  top: "bottleneck4_7/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_7/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_7/dim_inc/conv"
-  top: "bottleneck4_7/dim_inc/conv"
-  param {
-    name: "bottleneck4_7/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_7/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_7/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_6/add"
-  bottom: "bottleneck4_7/dim_inc/conv"
-  top: "bottleneck4_7/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_7/fn"
-  type: "ELU"
-  bottom: "bottleneck4_7/add"
-  top: "bottleneck4_7/add"
-}
-layer {
-  name: "bottleneck4_8/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_7/add"
-  top: "bottleneck4_8/dim_red/conv"
-  param {
-    name: "bottleneck4_8/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_8/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_8/dim_red/conv"
-  top: "bottleneck4_8/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_8/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_8/dim_red/conv"
-  top: "bottleneck4_8/dim_red/conv"
-  param {
-    name: "bottleneck4_8/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_8/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_8/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_8/dim_red/conv"
-  top: "bottleneck4_8/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_8/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_8/dim_red/conv"
-  top: "bottleneck4_8/inner/dw1/conv"
-  param {
-    name: "bottleneck4_8/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_8/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_8/inner/dw1/conv"
-  top: "bottleneck4_8/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_8/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_8/inner/dw1/conv"
-  top: "bottleneck4_8/inner/dw1/conv"
-  param {
-    name: "bottleneck4_8/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_8/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_8/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_8/inner/dw1/conv"
-  top: "bottleneck4_8/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_8/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_8/inner/dw1/conv"
-  top: "bottleneck4_8/dim_inc/conv"
-  param {
-    name: "bottleneck4_8/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_8/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_8/dim_inc/conv"
-  top: "bottleneck4_8/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_8/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_8/dim_inc/conv"
-  top: "bottleneck4_8/dim_inc/conv"
-  param {
-    name: "bottleneck4_8/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_8/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_8/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_7/add"
-  bottom: "bottleneck4_8/dim_inc/conv"
-  top: "bottleneck4_8/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_8/fn"
-  type: "ELU"
-  bottom: "bottleneck4_8/add"
-  top: "bottleneck4_8/add"
-}
-layer {
-  name: "bottleneck4_9/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_8/add"
-  top: "bottleneck4_9/dim_red/conv"
-  param {
-    name: "bottleneck4_9/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_9/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_9/dim_red/conv"
-  top: "bottleneck4_9/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_9/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_9/dim_red/conv"
-  top: "bottleneck4_9/dim_red/conv"
-  param {
-    name: "bottleneck4_9/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_9/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_9/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_9/dim_red/conv"
-  top: "bottleneck4_9/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_9/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_9/dim_red/conv"
-  top: "bottleneck4_9/inner/dw1/conv"
-  param {
-    name: "bottleneck4_9/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_9/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_9/inner/dw1/conv"
-  top: "bottleneck4_9/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_9/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_9/inner/dw1/conv"
-  top: "bottleneck4_9/inner/dw1/conv"
-  param {
-    name: "bottleneck4_9/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_9/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_9/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_9/inner/dw1/conv"
-  top: "bottleneck4_9/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_9/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_9/inner/dw1/conv"
-  top: "bottleneck4_9/dim_inc/conv"
-  param {
-    name: "bottleneck4_9/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_9/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_9/dim_inc/conv"
-  top: "bottleneck4_9/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_9/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_9/dim_inc/conv"
-  top: "bottleneck4_9/dim_inc/conv"
-  param {
-    name: "bottleneck4_9/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_9/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_9/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_8/add"
-  bottom: "bottleneck4_9/dim_inc/conv"
-  top: "bottleneck4_9/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_9/fn"
-  type: "ELU"
-  bottom: "bottleneck4_9/add"
-  top: "bottleneck4_9/add"
-}
-layer {
-  name: "bottleneck4_10/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_9/add"
-  top: "bottleneck4_10/dim_red/conv"
-  param {
-    name: "bottleneck4_10/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_10/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_10/dim_red/conv"
-  top: "bottleneck4_10/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_10/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_10/dim_red/conv"
-  top: "bottleneck4_10/dim_red/conv"
-  param {
-    name: "bottleneck4_10/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_10/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_10/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_10/dim_red/conv"
-  top: "bottleneck4_10/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_10/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_10/dim_red/conv"
-  top: "bottleneck4_10/inner/dw1/conv"
-  param {
-    name: "bottleneck4_10/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_10/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_10/inner/dw1/conv"
-  top: "bottleneck4_10/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_10/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_10/inner/dw1/conv"
-  top: "bottleneck4_10/inner/dw1/conv"
-  param {
-    name: "bottleneck4_10/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_10/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_10/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_10/inner/dw1/conv"
-  top: "bottleneck4_10/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_10/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_10/inner/dw1/conv"
-  top: "bottleneck4_10/dim_inc/conv"
-  param {
-    name: "bottleneck4_10/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_10/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_10/dim_inc/conv"
-  top: "bottleneck4_10/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_10/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_10/dim_inc/conv"
-  top: "bottleneck4_10/dim_inc/conv"
-  param {
-    name: "bottleneck4_10/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_10/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_10/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_9/add"
-  bottom: "bottleneck4_10/dim_inc/conv"
-  top: "bottleneck4_10/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_10/fn"
-  type: "ELU"
-  bottom: "bottleneck4_10/add"
-  top: "bottleneck4_10/add"
-}
-layer {
-  name: "bottleneck4_11/dim_red/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_10/add"
-  top: "bottleneck4_11/dim_red/conv"
-  param {
-    name: "bottleneck4_11/dim_red/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_11/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_11/dim_red/conv"
-  top: "bottleneck4_11/dim_red/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_11/dim_red/scale"
-  type: "Scale"
-  bottom: "bottleneck4_11/dim_red/conv"
-  top: "bottleneck4_11/dim_red/conv"
-  param {
-    name: "bottleneck4_11/dim_red/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_11/dim_red/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_11/dim_red/fn"
-  type: "ELU"
-  bottom: "bottleneck4_11/dim_red/conv"
-  top: "bottleneck4_11/dim_red/conv"
-}
-layer {
-  name: "bottleneck4_11/inner/dw1/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_11/dim_red/conv"
-  top: "bottleneck4_11/inner/dw1/conv"
-  param {
-    name: "bottleneck4_11/inner/dw1/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 64
-    bias_term: false
-    pad: 1
-    kernel_size: 3
-    group: 64
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_11/inner/dw1/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_11/inner/dw1/conv"
-  top: "bottleneck4_11/inner/dw1/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_11/inner/dw1/scale"
-  type: "Scale"
-  bottom: "bottleneck4_11/inner/dw1/conv"
-  top: "bottleneck4_11/inner/dw1/conv"
-  param {
-    name: "bottleneck4_11/inner/dw1/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_11/inner/dw1/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_11/inner/dw1/fn"
-  type: "ELU"
-  bottom: "bottleneck4_11/inner/dw1/conv"
-  top: "bottleneck4_11/inner/dw1/conv"
-}
-layer {
-  name: "bottleneck4_11/dim_inc/conv"
-  type: "Convolution"
-  bottom: "bottleneck4_11/inner/dw1/conv"
-  top: "bottleneck4_11/dim_inc/conv"
-  param {
-    name: "bottleneck4_11/dim_inc/conv/w"
-    lr_mult: 1
-    decay_mult: 1
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "bottleneck4_11/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "bottleneck4_11/dim_inc/conv"
-  top: "bottleneck4_11/dim_inc/conv"
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-  param {
-    lr_mult: 0
-    decay_mult: 0
-  }
-}
-layer {
-  name: "bottleneck4_11/dim_inc/scale"
-  type: "Scale"
-  bottom: "bottleneck4_11/dim_inc/conv"
-  top: "bottleneck4_11/dim_inc/conv"
-  param {
-    name: "bottleneck4_11/dim_inc/scale/a"
-    lr_mult: 1
-    decay_mult: 0
-  }
-  param {
-    name: "bottleneck4_11/dim_inc/scale/b"
-    lr_mult: 2
-    decay_mult: 0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1
-    }
-    bias_term: true
-    bias_filler {
-      value: 0
-    }
-  }
-}
-layer {
-  name: "bottleneck4_11/add"
-  type: "Eltwise"
-  bottom: "bottleneck4_10/add"
-  bottom: "bottleneck4_11/dim_inc/conv"
-  top: "bottleneck4_11/add"
-  eltwise_param {
-    operation: SUM
-  }
-}
-layer {
-  name: "bottleneck4_11/fn"
-  type: "ELU"
-  bottom: "bottleneck4_11/add"
-  top: "bottleneck4_11/add"
-}
-
-###################################################
-################# Embedding Head ##################
-###################################################
-
-layer {
-  name: "pooling/out"
-  type: "Pooling"
-  bottom: "bottleneck4_11/add"
-  top: "pooling/out"
-  pooling_param {
-    pool: MAX
-    global_pooling: true
-  }
-}
-layer {
-  name: "embd/dim_inc/conv"
-  type: "Convolution"
-  bottom: "pooling/out"
-  top: "embd/dim_inc/conv"
-  param {
-    lr_mult: 1.0
-    decay_mult: 1.0
-  }
-  convolution_param {
-    num_output: 512
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "embd/dim_inc/bn"
-  type: "BatchNorm"
-  bottom: "embd/dim_inc/conv"
-  top: "embd/dim_inc/conv"
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-}
-layer {
-  name: "embd/dim_inc/scale"
-  type: "Scale"
-  bottom: "embd/dim_inc/conv"
-  top: "embd/dim_inc/conv"
-  param {
-    lr_mult: 1.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 2.0
-    decay_mult: 0.0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1.0
-    }
-    bias_term: true
-    bias_filler {
-      value: 0.0
-    }
-  }
-}
-layer {
-  name: "embd/dim_inc/fn"
-  type: "ELU"
-  bottom: "embd/dim_inc/conv"
-  top: "embd/dim_inc/conv"
-}
-
-layer {
-  name: "embd/dim_red/conv"
-  type: "Convolution"
-  bottom: "embd/dim_inc/conv"
-  top: "embd/dim_red/conv"
-  param {
-    lr_mult: 1.0
-    decay_mult: 1.0
-  }
-  convolution_param {
-    num_output: 256
-    bias_term: false
-    pad: 0
-    kernel_size: 1
-    stride: 1
-    weight_filler {
-      type: "msra"
-    }
-  }
-}
-layer {
-  name: "embd/dim_red/bn"
-  type: "BatchNorm"
-  bottom: "embd/dim_red/conv"
-  top: "embd/dim_red/conv"
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 0.0
-    decay_mult: 0.0
-  }
-}
-layer {
-  name: "embd/dim_red/scale"
-  type: "Scale"
-  bottom: "embd/dim_red/conv"
-  top: "embd/dim_red/conv"
-  param {
-    lr_mult: 1.0
-    decay_mult: 0.0
-  }
-  param {
-    lr_mult: 2.0
-    decay_mult: 0.0
-  }
-  scale_param {
-    axis: 1
-    filler {
-      value: 1.0
-    }
-    bias_term: true
-    bias_filler {
-      value: 0.0
-    }
-  }
-}
-
diff --git a/models/intel/person-reidentification-retail-0103/description/person-reidentification-retail-0103.jpg b/models/intel/person-reidentification-retail-0103/description/person-reidentification-retail-0103.jpg
new file mode 100644
index 00000000000..4e0db3f5e06
Binary files /dev/null and b/models/intel/person-reidentification-retail-0103/description/person-reidentification-retail-0103.jpg differ
diff --git a/models/intel/person-reidentification-retail-0103/description/person-reidentification-retail-0103.md b/models/intel/person-reidentification-retail-0103/description/person-reidentification-retail-0103.md
new file mode 100644
index 00000000000..2c1bbedfe04
--- /dev/null
+++ b/models/intel/person-reidentification-retail-0103/description/person-reidentification-retail-0103.md
@@ -0,0 +1,53 @@
+# person-reidentification-retail-0103
+
+## Use Case and High-Level Description
+
+This is a person reidentification model for a general scenario. It uses a whole
+body image as an input and outputs an embedding vector to match a pair of images
+by the cosine distance. The model is based on the OmniScaleNet backbone developed for fast inference.
+A single reidentification head from the 1/16 scale
+feature map outputs an embedding vector of 256 floats.
+
+## Example
+
+![](./person-reidentification-retail-0103.jpg)
+
+## Specification
+
+| Metric                            | Value                                     |
+|-----------------------------------|-------------------------------------------|
+| GlobalMe-reID rank@1 accuracy     | 93.5%                                     |
+| GlobalMe-reID mAP                 | 69.5%                                     |
+| Pose coverage                     | Standing upright, parallel to image plane |
+| Support of occluded pedestrians   | YES                                       |
+| Occlusion coverage                | <50%                                      |
+| GFlops                            | 0.564                                     |
+| MParams                           | 0.597                                     |
+| Source framework                  | PyTorch\*                                 |
+
+The cumulative matching curve (CMC) at rank-1 is the accuracy denoting the probability
+of locating at least one true positive in the top-1 rank.
+Mean Average Precision (mAP) is the mean of the Average Precision (AP) values over all queries.
+AP is defined as the area under the
+[precision and recall](https://en.wikipedia.org/wiki/Precision_and_recall) curve.
+
+## Performance
+
+## Inputs
+
+The net expects one input image of the shape [1x3x256x128] with the [BxCxHxW] format, where:
+- B - batch size
+- C - number of channels
+- H - image height
+- W - image width
+
+The expected color order is BGR.
+
+## Outputs
+
+The net outputs a blob with the [1, 256] shape named `descriptor`, which can be
+compared with other descriptors using the
+[cosine distance](https://en.wikipedia.org/wiki/Cosine_similarity).
+
+## Legal Information
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/person-reidentification-retail-0103/model.yml b/models/intel/person-reidentification-retail-0103/model.yml
new file mode 100644
index 00000000000..07971606eba
--- /dev/null
+++ b/models/intel/person-reidentification-retail-0103/model.yml
@@ -0,0 +1,45 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  Single embedding-based person reidentification model (the model is a trade-off between
+  performance and accuracy)
+task_type: object_attributes
+files:
+  - name: FP32/person-reidentification-retail-0103.xml
+    size: 429052
+    sha256: 850dbc1d53901c0e36c101fddfb8999647b588f791e55ca021b85963ce0e28e9
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0103/FP32/person-reidentification-retail-0103.xml
+  - name: FP32/person-reidentification-retail-0103.bin
+    size: 2365244
+    sha256: 816f560505526a0c8d4b66d0629c0bd00f5df201fb76186e860851521bf14f91
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0103/FP32/person-reidentification-retail-0103.bin
+  - name: FP16/person-reidentification-retail-0103.xml
+    size: 428746
+    sha256: 2ffb7e9d60159f2cff0375a83362ce60131692f4835129c7debb3417425e5889
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0103/FP16/person-reidentification-retail-0103.xml
+  - name: FP16/person-reidentification-retail-0103.bin
+    size: 1182656
+    sha256: e17a3a323cf771918350d777d9398143e7ad8a6b404eb294b67ee2a837f36cae
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0103/FP16/person-reidentification-retail-0103.bin
+  - name: FP32-INT8/person-reidentification-retail-0103.xml
+    size: 1215718
+    sha256: 62fea19cd7ee93cbb3b2d262a09ce5a7ff3b801fead28e79de84f1bbfbcd18ce
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0103/FP32-INT8/person-reidentification-retail-0103.xml
+  - name: FP32-INT8/person-reidentification-retail-0103.bin
+    size: 2462604
+    sha256: 8f4f8e74a869847f2cdb2bea0fba6027977c16d6f4e259e14f3bb0a8060ba685
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0103/FP32-INT8/person-reidentification-retail-0103.bin
+framework: dldt
+license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-reidentification-retail-0107/description/person-reidentification-retail-0107.jpg b/models/intel/person-reidentification-retail-0107/description/person-reidentification-retail-0107.jpg
new file mode 100644
index 00000000000..e161fc06113
Binary files /dev/null and b/models/intel/person-reidentification-retail-0107/description/person-reidentification-retail-0107.jpg differ
diff --git a/models/intel/person-reidentification-retail-0107/description/person-reidentification-retail-0107.md b/models/intel/person-reidentification-retail-0107/description/person-reidentification-retail-0107.md
new file mode 100644
index 00000000000..59610492f92
--- /dev/null
+++ b/models/intel/person-reidentification-retail-0107/description/person-reidentification-retail-0107.md
@@ -0,0 +1,53 @@
+# person-reidentification-retail-0107
+
+## Use Case and High-Level Description
+
+This is a person reidentification model for a general scenario. It uses a whole
+body image as an input and outputs an embedding vector to match a pair of images
+by the cosine distance. The model is based on the OmniScaleNet backbone developed for fast inference.
+A single reidentification head from the 1/16 scale
+feature map outputs an embedding vector of 256 floats.
+
+## Example
+
+![](./person-reidentification-retail-0107.jpg)
+
+## Specification
+
+| Metric                            | Value                                     |
+|-----------------------------------|-------------------------------------------|
+| GlobalMe-reID rank@1 accuracy     | 91.7%                                     |
+| GlobalMe-reID mAP                 | 63.4%                                     |
+| Pose coverage                     | Standing upright, parallel to image plane |
+| Support of occluded pedestrians   | YES                                       |
+| Occlusion coverage                | <50%                                      |
+| GFlops                            | 0.174                                     |
+| MParams                           | 0.183                                     |
+| Source framework                  | PyTorch\*                                 |
+
+The cumulative matching curve (CMC) at rank-1 is the accuracy denoting the probability
+of locating at least one true positive in the top-1 rank.
+Mean Average Precision (mAP) is the mean of the Average Precision (AP) values over all queries. AP is defined as
+the area under the
+[precision and recall](https://en.wikipedia.org/wiki/Precision_and_recall) curve.
+
+## Performance
+
+## Inputs
+
+The net expects one input image of the shape [1x3x256x128] with the [BxCxHxW] format, where:
+- B - batch size
+- C - number of channels
+- H - image height
+- W - image width
+
+The expected color order is BGR.
+
+## Outputs
+
+The net outputs a blob with the [1, 256] shape named `descriptor`, which can be
+compared with other descriptors using the
+[cosine distance](https://en.wikipedia.org/wiki/Cosine_similarity).
+
+## Legal Information
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/person-reidentification-retail-0107/model.yml b/models/intel/person-reidentification-retail-0107/model.yml
new file mode 100644
index 00000000000..6b9d855b1ab
--- /dev/null
+++ b/models/intel/person-reidentification-retail-0107/model.yml
@@ -0,0 +1,45 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  Single embedding-based person reidentification model (the model is a trade-off between
+  performance and accuracy)
+task_type: object_attributes
+files:
+  - name: FP32/person-reidentification-retail-0107.xml
+    size: 428538
+    sha256: 5e94d23e328ae8feb444e8ad472157a19ddc3ec7a5a0e6dd5ab3792b86d533cf
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0107/FP32/person-reidentification-retail-0107.xml
+  - name: FP32/person-reidentification-retail-0107.bin
+    size: 728532
+    sha256: 06c020c064a2659bf2e84319a1afbd1229a6493c31cb7d34d912f87637b18e9a
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0107/FP32/person-reidentification-retail-0107.bin
+  - name: FP16/person-reidentification-retail-0107.xml
+    size: 428332
+    sha256: 30a3fe994ac4e1e2771d4baa96dc9c5d909ec169a44fcb1d5ceff1ffcda326b3
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0107/FP16/person-reidentification-retail-0107.xml
+  - name: FP16/person-reidentification-retail-0107.bin
+    size: 364300
+    sha256: 1966e4681a747a7767e144780069de5bf9440579c8153cd1c1aead69e4da2242
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0107/FP16/person-reidentification-retail-0107.bin
+  - name: FP32-INT8/person-reidentification-retail-0107.xml
+    size: 1213621
+    sha256: c8ca6da82c4db09c46a0465628fd881f9d501fdc8d360d3b66a50f89c5affe48
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0107/FP32-INT8/person-reidentification-retail-0107.xml
+  - name: FP32-INT8/person-reidentification-retail-0107.bin
+    size: 778660
+    sha256: acd7448d3d3d87d799c2b428b673af89f621d4c7b5d915800cb577f8af57c080
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0107/FP32-INT8/person-reidentification-retail-0107.bin
+framework: dldt
+license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-reidentification-retail-0200/description/person-reidentification-retail-0200.jpg b/models/intel/person-reidentification-retail-0200/description/person-reidentification-retail-0200.jpg
new file mode 100644
index 00000000000..7b70ee2a2bc
Binary files /dev/null and b/models/intel/person-reidentification-retail-0200/description/person-reidentification-retail-0200.jpg differ
diff --git a/models/intel/person-reidentification-retail-0200/description/person-reidentification-retail-0200.md b/models/intel/person-reidentification-retail-0200/description/person-reidentification-retail-0200.md
new file mode 100644
index 00000000000..ad93d6fd4a5
--- /dev/null
+++ b/models/intel/person-reidentification-retail-0200/description/person-reidentification-retail-0200.md
@@ -0,0 +1,53 @@
+# person-reidentification-retail-0200
+
+## Use Case and High-Level Description
+
+This is a person reidentification model for a general scenario. It uses a whole
+body image as an input and outputs an embedding vector to match a pair of images
+by the cosine distance. The model is based on the OmniScaleNet backbone developed for fast inference.
+A single reidentification head from the 1/16 scale
+feature map outputs an embedding vector of 256 floats.
+
+## Example
+
+![](./person-reidentification-retail-0200.jpg)
+
+## Specification
+
+| Metric                            | Value                                     |
+|-----------------------------------|-------------------------------------------|
+| GlobalMe-reID rank@1 accuracy     | 98.4%                                     |
+| GlobalMe-reID mAP                 | 87.2%                                     |
+| Pose coverage                     | Standing upright, parallel to image plane |
+| Support of occluded pedestrians   | YES                                       |
+| Occlusion coverage                | <50%                                      |
+| GFlops                            | 5.506                                     |
+| MParams                           | 4.723                                     |
+| Source framework                  | PyTorch\*                                 |
+
+The cumulative matching curve (CMC) at rank-1 is the accuracy denoting the probability
+of locating at least one true positive in the top-1 rank.
+Mean Average Precision (mAP) is the mean of the Average Precision (AP) values over all queries. AP is defined as
+the area under the
+[precision and recall](https://en.wikipedia.org/wiki/Precision_and_recall) curve.
+
+## Performance
+
+## Inputs
+
+The net expects one input image of the shape [1x3x256x128] with the [BxCxHxW] format, where:
+- B - batch size
+- C - number of channels
+- H - image height
+- W - image width
+
+The expected color order is BGR.
+
+## Outputs
+
+The net outputs a blob with the [1, 512] shape named `descriptor`, which can be
+compared with other descriptors using the
+[cosine distance](https://en.wikipedia.org/wiki/Cosine_similarity).
+
+## Legal Information
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/person-reidentification-retail-0200/model.yml b/models/intel/person-reidentification-retail-0200/model.yml
new file mode 100644
index 00000000000..fc09c00bffb
--- /dev/null
+++ b/models/intel/person-reidentification-retail-0200/model.yml
@@ -0,0 +1,44 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  High accuracy single embedding-based person reidentification model
+task_type: object_attributes
+files:
+  - name: FP32/person-reidentification-retail-0200.xml
+    size: 445391
+    sha256: 51dccbd3c345850029333f5031c4c671d29b8a78bea4f8e440dbcfe04d9558b3
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0200/FP32/person-reidentification-retail-0200.xml
+  - name: FP32/person-reidentification-retail-0200.bin
+    size: 18800388
+    sha256: 264f2cf6ea48bc412ffeaa55604a571214efaa9d177ee516a2f4ad5b01e4f2c5
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0200/FP32/person-reidentification-retail-0200.bin
+  - name: FP16/person-reidentification-retail-0200.xml
+    size: 445236
+    sha256: 6a5738d72d6a3521c1f9a27f4db95c89734921829fd587d2802ded63792e9420
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0200/FP16/person-reidentification-retail-0200.xml
+  - name: FP16/person-reidentification-retail-0200.bin
+    size: 9400240
+    sha256: f813b64ae75e329cce2a0193967a3554ca6f730c2a88e20cd150c2645880322a
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0200/FP16/person-reidentification-retail-0200.bin
+  - name: FP32-INT8/person-reidentification-retail-0200.xml
+    size: 1269200
+    sha256: be80869dcaefe1d267c3a09153bb9dbfe08c51e17e901799494c53322e9c3259
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0200/FP32-INT8/person-reidentification-retail-0200.xml
+  - name: FP32-INT8/person-reidentification-retail-0200.bin
+    size: 19002500
+    sha256: c58940b2e6e3e4dd18d9fad94aa4838137c5216afb978ad2a9f7c48533dce348
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-reidentification-retail-0200/FP32-INT8/person-reidentification-retail-0200.bin
+framework: dldt
+license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-vehicle-bike-detection-crossroad-0078/model.yml b/models/intel/person-vehicle-bike-detection-crossroad-0078/model.yml
index 41363f3a425..d38750425dc 100644
--- a/models/intel/person-vehicle-bike-detection-crossroad-0078/model.yml
+++ b/models/intel/person-vehicle-bike-detection-crossroad-0078/model.yml
@@ -13,35 +13,34 @@
 # limitations under the License.
 
 description: >-
-  Person/Vehicle/Bike detector is based on SSD detection architecture, RMNet backbone,
-  and learnable image downscale block (like person-vehicle-bike-detection-crossroad-0066,
-  but with extra pooling). The model is intended for security surveillance applications
-  and works in a variety of scenes and weather/lighting conditions.
+  Multiclass (person, vehicle, non-vehicle) detector based on SSD detection architecture,
+  RMNet backbone and learnable image downscale block (person-vehicle-bike-detection-crossroad-0066
+  with extra pooling)
 task_type: detection
 files:
   - name: FP32/person-vehicle-bike-detection-crossroad-0078.xml
-    size: 169499
-    sha256: f6ede9a43c2576726b05c29b726cd0c4d1831c3f43b88b7b8a40f521f5cd60d1
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-vehicle-bike-detection-crossroad-0078/FP32/person-vehicle-bike-detection-crossroad-0078.xml
+    size: 354808
+    sha256: a5c9fe84fe9a2b463eddd5b14535824ada1f238459ef6a96ddd5660b986bed47
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-vehicle-bike-detection-crossroad-0078/FP32/person-vehicle-bike-detection-crossroad-0078.xml
   - name: FP32/person-vehicle-bike-detection-crossroad-0078.bin
-    size: 4713900
-    sha256: 755e0442d18eadf6b6b1b83cf0b80e742e9e2f4c0792e5050509a9f376636a94
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-vehicle-bike-detection-crossroad-0078/FP32/person-vehicle-bike-detection-crossroad-0078.bin
+    size: 4713980
+    sha256: 178e05f0635b0ee35b577a9dd31ea6da2a2a842635793f1ad18907d00f3a966a
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-vehicle-bike-detection-crossroad-0078/FP32/person-vehicle-bike-detection-crossroad-0078.bin
   - name: FP16/person-vehicle-bike-detection-crossroad-0078.xml
-    size: 169325
-    sha256: da449fa48224778d56e6ba8bb82a72d4115b4f7c31c5b1383dd0c363b7cb3488
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-vehicle-bike-detection-crossroad-0078/FP16/person-vehicle-bike-detection-crossroad-0078.xml
+    size: 354639
+    sha256: 153660e414e60ca83f08f8b955e0dd318210570106b43999f1d8a3fa0fa639fa
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-vehicle-bike-detection-crossroad-0078/FP16/person-vehicle-bike-detection-crossroad-0078.xml
   - name: FP16/person-vehicle-bike-detection-crossroad-0078.bin
-    size: 2356956
-    sha256: 361bb6e53c199e0b332cb27f11c553b08432b3e39218c8b865cf8116083703c8
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-vehicle-bike-detection-crossroad-0078/FP16/person-vehicle-bike-detection-crossroad-0078.bin
-  - name: INT8/person-vehicle-bike-detection-crossroad-0078.xml
-    size: 20853122
-    sha256: 5023c755c14ec9e22ff44968b71367965ac36a99b3bf1f05c1e20fdd4a28a98a
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-vehicle-bike-detection-crossroad-0078/INT8/person-vehicle-bike-detection-crossroad-0078.xml
-  - name: INT8/person-vehicle-bike-detection-crossroad-0078.bin
-    size: 4713900
-    sha256: 4e1bd5ee45a90b4fe834281d2b35b97c92ab553b6835e2677ec4de79fd446c9c
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-vehicle-bike-detection-crossroad-0078/INT8/person-vehicle-bike-detection-crossroad-0078.bin
+    size: 2357042
+    sha256: a074ff0cad298ed9c35d0ce6ed58e09ee05216b907c97e6bb50f1b77a046bcfd
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-vehicle-bike-detection-crossroad-0078/FP16/person-vehicle-bike-detection-crossroad-0078.bin
+  - name: FP32-INT8/person-vehicle-bike-detection-crossroad-0078.xml
+    size: 960289
+    sha256: e9fca40ea26f33bc55646ae7c92baae95786f53914f11e40b8280a9e35b0a176
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-vehicle-bike-detection-crossroad-0078/FP32-INT8/person-vehicle-bike-detection-crossroad-0078.xml
+  - name: FP32-INT8/person-vehicle-bike-detection-crossroad-0078.bin
+    size: 4796540
+    sha256: a5c797b9d0a2202c7e574bae55c90ea4cca594510fdfa3a1800c9832f466d52c
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-vehicle-bike-detection-crossroad-0078/FP32-INT8/person-vehicle-bike-detection-crossroad-0078.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/person-vehicle-bike-detection-crossroad-1016/model.yml b/models/intel/person-vehicle-bike-detection-crossroad-1016/model.yml
index d7286785aec..9e6b2f6d77e 100644
--- a/models/intel/person-vehicle-bike-detection-crossroad-1016/model.yml
+++ b/models/intel/person-vehicle-bike-detection-crossroad-1016/model.yml
@@ -13,25 +13,33 @@
 # limitations under the License.
 
 description: >-
-  Multiclass (person -  vehicle -  non-vehicle) detector based on SSD detection
-  architecture -  MobileNetV2 backbone)
+  Multiclass (person, vehicle, non-vehicle) detector based on SSD detection architecture
+  (MobileNetV2 backbone)
 task_type: detection
 files:
   - name: FP32/person-vehicle-bike-detection-crossroad-1016.xml
-    size: 82676
-    sha256: 56d2b92139749dc8d35fca1ee2633f97f2146e0857f3cf76ca9791c107286ffd
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-vehicle-bike-detection-crossroad-1016/FP32/person-vehicle-bike-detection-crossroad-1016.xml
+    size: 194333
+    sha256: 040bded9370548d6ca02286b764334291c4ce6edb3ca6facd1758490a6433230
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-vehicle-bike-detection-crossroad-1016/FP32/person-vehicle-bike-detection-crossroad-1016.xml
   - name: FP32/person-vehicle-bike-detection-crossroad-1016.bin
-    size: 11547916
-    sha256: 0858938f00ee87fb47c632f47039316f6060a096e74dd3e5dc061d850b4b702d
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-vehicle-bike-detection-crossroad-1016/FP32/person-vehicle-bike-detection-crossroad-1016.bin
+    size: 11548004
+    sha256: 61c9deaca903bb107aecfc31faeb402c894e0d43ab3817db8d9d05d43dfa68cf
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-vehicle-bike-detection-crossroad-1016/FP32/person-vehicle-bike-detection-crossroad-1016.bin
   - name: FP16/person-vehicle-bike-detection-crossroad-1016.xml
-    size: 82582
-    sha256: a040f8d3e81b2d1a352318bc0fd8d8b9dd9fbf7a9c591cef7d0c2e7171efbfe8
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-vehicle-bike-detection-crossroad-1016/FP16/person-vehicle-bike-detection-crossroad-1016.xml
+    size: 194219
+    sha256: 3392a26b381ebbfa837cafb976a828fd8519ff58be08aac72cb54f4f40b58184
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-vehicle-bike-detection-crossroad-1016/FP16/person-vehicle-bike-detection-crossroad-1016.xml
   - name: FP16/person-vehicle-bike-detection-crossroad-1016.bin
-    size: 5773968
-    sha256: 3d22081d3b1a8c3e24dcbbe23b677a92ad144530880df33f070615e42901cc55
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/person-vehicle-bike-detection-crossroad-1016/FP16/person-vehicle-bike-detection-crossroad-1016.bin
+    size: 5774054
+    sha256: a0ba3bc9ca17330c731b395153651c22a666050cd06413c01059070681dc79a7
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-vehicle-bike-detection-crossroad-1016/FP16/person-vehicle-bike-detection-crossroad-1016.bin
+  - name: FP32-INT8/person-vehicle-bike-detection-crossroad-1016.xml
+    size: 510391
+    sha256: 82d95cf77a1a5a4c2d0d8a6c364229700f293ccd8df883a081c2dc33f4025462
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-vehicle-bike-detection-crossroad-1016/FP32-INT8/person-vehicle-bike-detection-crossroad-1016.xml
+  - name: FP32-INT8/person-vehicle-bike-detection-crossroad-1016.bin
+    size: 11777480
+    sha256: 0abdc201405b2f910f3ddd49307afd89ee43ab80009f9827b4f16e7aa7274157
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/person-vehicle-bike-detection-crossroad-1016/FP32-INT8/person-vehicle-bike-detection-crossroad-1016.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/product-detection-0001/description/product-detection-0001.jpg b/models/intel/product-detection-0001/description/product-detection-0001.jpg
new file mode 100644
index 00000000000..decba1427c3
Binary files /dev/null and b/models/intel/product-detection-0001/description/product-detection-0001.jpg differ
diff --git a/models/intel/product-detection-0001/description/product-detection-0001.md b/models/intel/product-detection-0001/description/product-detection-0001.md
new file mode 100644
index 00000000000..ddbebcd31f5
--- /dev/null
+++ b/models/intel/product-detection-0001/description/product-detection-0001.md
@@ -0,0 +1,48 @@
+# product-detection-0001
+
+## Use Case and High-Level Description
+
+A product detector based on the SSD-lite architecture with [MobileNetV2](https://arxiv.org/pdf/1801.04381.pdf) as a backbone, intended for self-checkout point-of-sale scenes.
+The network can detect 12 classes of objects (`sprite`, `kool-aid`, `extra`, `ocelo`, `finish`, `mtn_dew`, `best_foods`, `gatorade`, `heinz`, `ruffles`, `pringles`, `del_monte`). Labels 0 and 1 correspond to `background_label` and `undefined`, respectively.
+
+## Example
+
+![](./product-detection-0001.jpg)
+
+## Specification
+
+| Metric                                                            | Value    |
+|-------------------------------------------------------------------|----------|
+| Average Precision (AP) @[ IoU=0.50:0.95,  area=all, maxDets=100 ] | 0.715    |
+| GFlops                                                            | 3.598    |
+| MParams                                                           | 3.212    |
+| Source framework                                                  | PyTorch* |
+
+## Performance
+
+## Inputs
+
+1. Name: `input`, shape: [1x3x512x512]. An input image in the format [BxCxHxW],
+   where:
+
+    - B - batch size
+    - C - number of channels
+    - H - image height
+    - W - image width
+
+   Expected color order: BGR.
+
+## Outputs
+
+1. The net outputs a blob with the [1, 1, N, 7] shape, where N is the number of detected
+   bounding boxes. For each detection, the description has the [`image_id`, `label`, `conf`, `x_min`, `y_min`, `x_max`, `y_max`] format,
+   where:
+
+    - `image_id` - ID of the image in the batch
+    - `label` - predicted class ID
+    - `conf` - confidence for the predicted class
+    - (`x_min`, `y_min`) - coordinates of the top left bounding box corner
+    - (`x_max`, `y_max`) - coordinates of the bottom right bounding box corner
+
+## Legal Information
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/product-detection-0001/model.yml b/models/intel/product-detection-0001/model.yml
new file mode 100644
index 00000000000..3f71e250e30
--- /dev/null
+++ b/models/intel/product-detection-0001/model.yml
@@ -0,0 +1,44 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  Product detection based on MobileNetV2.
+task_type: detection
+files:
+  - name: FP32/product-detection-0001.xml
+    size: 273207
+    sha256: ec88b66d16f0899e7a833c5da5de0be3304062a926dd52662cbca4a2c68247bc
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/product-detection-0001/FP32/product-detection-0001.xml
+  - name: FP32/product-detection-0001.bin
+    size: 12850036
+    sha256: 93f2ccd0ce7ba88f190f51b8a62d67fd5178444496f068dc33488fb1949e2726
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/product-detection-0001/FP32/product-detection-0001.bin
+  - name: FP16/product-detection-0001.xml
+    size: 273019
+    sha256: c6488db369f51c892172b9adc83f466553c7c36f9e4dac531891c1992c79051d
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/product-detection-0001/FP16/product-detection-0001.xml
+  - name: FP16/product-detection-0001.bin
+    size: 6425070
+    sha256: ecc6f6bdae9a49c1749a324e0e98320a0a9aae97cc0c2b536853ee46b9178690
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/product-detection-0001/FP16/product-detection-0001.bin
+  - name: FP32-INT8/product-detection-0001.xml
+    size: 674722
+    sha256: 8320116effb73fdca11adb7238b7dd95f93e37e359fc44ba08ac35aa35317dd3
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/product-detection-0001/FP32-INT8/product-detection-0001.xml
+  - name: FP32-INT8/product-detection-0001.bin
+    size: 13101168
+    sha256: 741f6bee9d617ca20a5c5813ed3defc240b4fdef84c4c2582e3e4bb586460d1f
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/product-detection-0001/FP32-INT8/product-detection-0001.bin
+framework: dldt
+license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/resnet-50-int8-sparse-v1-tf-0001/description/resnet-50-int8-sparse-v1-tf-0001.md b/models/intel/resnet-50-int8-sparse-v1-tf-0001/description/resnet-50-int8-sparse-v1-tf-0001.md
deleted file mode 100644
index e3f39d2a4ba..00000000000
--- a/models/intel/resnet-50-int8-sparse-v1-tf-0001/description/resnet-50-int8-sparse-v1-tf-0001.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# resnet-50-int8-sparse-v1-tf-0001
-
-## Use Case and High-Level Description
-
-This is the Resnet-50 v1 model that is designed to perform image classification. The model has been pretrained on the ImageNet image database and then pruned to **28.4%** of sparsity and quantized to INT8 fixed-point precision using so-called Quantization-aware training approach implemented in TensorFlow framework. The sparsity is represented by zeros inside the weights of Convolutional and Fully-conneted layers. For details about the original floating point model, check out the [paper](https://arxiv.org/pdf/1512.03385.pdf).
-
-The model input is a blob that consists of a single image of "1x224x224x3" in BGR order.
-
-The model output for `resnet-50-int8-sparse-v1-tf-0001` is the usual object classifier output for the 1000 different classifications matching those in the ImageNet database.
-
-## Example
-
-## Specification
-
-| Metric            | Value         |
-|-------------------|---------------|
-| Type              | Classification|
-| GFLOPs            | 6.996         |
-| MParams           | 25.530        |
-| Source framework  | TensorFlow    |
-
-## Accuracy
-
-The quality metrics calculated on ImageNet validation dataset is 75.05% accuracy top-1.
-
-| Metric                    | Value         |
-|---------------------------|---------------|
-| Accuracy top-1 (ImageNet) |        75.05% |
-
-## Performance
-
-## Input
-
-Image, shape - `1,224,224,3`, format is `B,H,W,C` where:
-
-- `B` - batch size
-- `H` - height
-- `W` - width
-- `C` - channel
-
-Channel order is `BGR`
-
-## Output
-
-Object classifier according to ImageNet classes, shape -`1,1000`, output data format is `B,C` where:
-
-- `B` - batch size
-- `C` - predicted probabilities for each class in  [0, 1] range
-
diff --git a/models/intel/resnet-50-int8-sparse-v1-tf-0001/model.yml b/models/intel/resnet-50-int8-sparse-v1-tf-0001/model.yml
deleted file mode 100644
index d9c5131dda3..00000000000
--- a/models/intel/resnet-50-int8-sparse-v1-tf-0001/model.yml
+++ /dev/null
@@ -1,49 +0,0 @@
-# Copyright (c) 2019 Intel Corporation
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-description: >-
-  This is the Resnet-50 v1 model that is designed to perform image classification.
-  The model has been pretrained on the ImageNet image database and then pruned
-  to **28.4%** of sparsity and quantized to INT8 fixed-point precision using
-  so-called Quantization-aware training approach implemented in TensorFlow framework.
-  The sparsity is represented by zeros inside the weights of Convolutional and
-  Fully-conneted layers. For details about the original floating point model,
-  check out the [paper](https://arxiv.org/pdf/1512.03385.pdf).
-
-  The model input is a blob that consists of a single image of "1x224x224x3"
-  in BGR order.
-
-  The model output for `resnet-50-int8-sparse-v1-tf-0001` is the usual object
-  classifier output for the 1000 different classifications matching those in
-  the ImageNet database.
-task_type: classification
-files:
-  - name: FP32/resnet-50-int8-sparse-v1-tf-0001.xml
-    size: 1445288
-    sha256: f15e06873c306a33a5586e4fa6a08e0792a69021a57c724ca3a5b56b7c2b6656
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet-50-int8-sparse-v1-tf-0001/FP32/resnet-50-int8-sparse-v1-tf-0001.xml
-  - name: FP32/resnet-50-int8-sparse-v1-tf-0001.bin
-    size: 102121952
-    sha256: 6fe77c36fad1aa67a813ab55a9e087a9ed799930b06bb87a6e30454b54caf7e3
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet-50-int8-sparse-v1-tf-0001/FP32/resnet-50-int8-sparse-v1-tf-0001.bin
-  - name: FP16/resnet-50-int8-sparse-v1-tf-0001.xml
-    size: 1445229
-    sha256: 7fd5efca06819c73291ea10e80909efc4f1acfdaa807e58494424ddba0f7eedc
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet-50-int8-sparse-v1-tf-0001/FP16/resnet-50-int8-sparse-v1-tf-0001.xml
-  - name: FP16/resnet-50-int8-sparse-v1-tf-0001.bin
-    size: 51060996
-    sha256: 305324c5218954254fba6ae9ae4fa76359a06b046ba6671120454f33441c91ea
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet-50-int8-sparse-v1-tf-0001/FP16/resnet-50-int8-sparse-v1-tf-0001.bin
-framework: dldt
-license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/resnet-50-int8-sparse-v2-tf-0001/description/resnet-50-int8-sparse-v2-tf-0001.md b/models/intel/resnet-50-int8-sparse-v2-tf-0001/description/resnet-50-int8-sparse-v2-tf-0001.md
deleted file mode 100644
index c76b87e49f5..00000000000
--- a/models/intel/resnet-50-int8-sparse-v2-tf-0001/description/resnet-50-int8-sparse-v2-tf-0001.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# resnet-50-int8-sparse-v2-tf-0001
-
-## Use Case and High-Level Description
-
-This is the Resnet-50 v1 model that is designed to perform image classification. The model has been pretrained on the ImageNet image database and then pruned to **60.4%** of sparsity and quantized to INT8 fixed-point precision using so-called Quantization-aware training approach implemented in TensorFlow framework. The sparsity is represented by zeros inside the weights of Convolutional and Fully-conneted layers. For details about the original floating point model, check out the [paper](https://arxiv.org/pdf/1512.03385.pdf).
-
-The model input is a blob that consists of a single image of "1x224x224x3" in BGR order.
-
-The model output for `resnet-50-int8-sparse-v2-tf-0001` is the usual object classifier output for the 1000 different classifications matching those in the ImageNet database.
-
-## Example
-
-## Specification
-
-| Metric            | Value         |
-|-------------------|---------------|
-| Type              | Classification|
-| GFLOPs            | 6.996         |
-| MParams           | 25.530        |
-| Source framework  | TensorFlow    |
-
-## Accuracy
-
-The quality metrics calculated on ImageNet validation dataset is 74.56% accuracy top-1.
-
-| Metric                    | Value         |
-|---------------------------|---------------|
-| Accuracy top-1 (ImageNet) |        74.56% |
-
-## Performance
-
-## Input
-
-Image, shape - `1,224,224,3`, format is `B,H,W,C` where:
-
-- `B` - batch size
-- `H` - height
-- `W` - width
-- `C` - channel
-
-Channel order is `BGR`
-
-## Output
-
-Object classifier according to ImageNet classes, shape -`1,1000`, output data format is `B,C` where:
-
-- `B` - batch size
-- `C` - predicted probabilities for each class in  [0, 1] range
-
diff --git a/models/intel/resnet-50-int8-sparse-v2-tf-0001/model.yml b/models/intel/resnet-50-int8-sparse-v2-tf-0001/model.yml
deleted file mode 100644
index 4bb59b53ef0..00000000000
--- a/models/intel/resnet-50-int8-sparse-v2-tf-0001/model.yml
+++ /dev/null
@@ -1,49 +0,0 @@
-# Copyright (c) 2019 Intel Corporation
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-description: >-
-  This is the Resnet-50 v1 model that is designed to perform image classification.
-  The model has been pretrained on the ImageNet image database and then pruned
-  to **60.4%** of sparsity and quantized to INT8 fixed-point precision using
-  so-called Quantization-aware training approach implemented in TensorFlow framework.
-  The sparsity is represented by zeros inside the weights of Convolutional and
-  Fully-conneted layers. For details about the original floating point model,
-  check out the [paper](https://arxiv.org/pdf/1512.03385.pdf).
-
-  The model input is a blob that consists of a single image of "1x224x224x3"
-  in BGR order.
-
-  The model output for `resnet-50-int8-sparse-v2-tf-0001` is the usual object
-  classifier output for the 1000 different classifications matching those in
-  the ImageNet database.
-task_type: classification
-files:
-  - name: FP32/resnet-50-int8-sparse-v2-tf-0001.xml
-    size: 1452432
-    sha256: 1dad39da1dc2a0b0ca75e396ad4574e98dafdff9388c7338293c31b4d95d6cdf
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet-50-int8-sparse-v2-tf-0001/FP32/resnet-50-int8-sparse-v2-tf-0001.xml
-  - name: FP32/resnet-50-int8-sparse-v2-tf-0001.bin
-    size: 102121952
-    sha256: 4566cf3a3124ff98a911ac4c3092cd4198d83cf94e7fd5003d36a2e764c2319a
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet-50-int8-sparse-v2-tf-0001/FP32/resnet-50-int8-sparse-v2-tf-0001.bin
-  - name: FP16/resnet-50-int8-sparse-v2-tf-0001.xml
-    size: 1452373
-    sha256: 29aa5eb3d85f2b14ac148c8aac4349ba7d0a89c857646b749b9a2b74310ba460
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet-50-int8-sparse-v2-tf-0001/FP16/resnet-50-int8-sparse-v2-tf-0001.xml
-  - name: FP16/resnet-50-int8-sparse-v2-tf-0001.bin
-    size: 51060996
-    sha256: c9f0d85a863e6d9c4db9be390862c2530535dd67016a3b96f764f9e07715738f
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet-50-int8-sparse-v2-tf-0001/FP16/resnet-50-int8-sparse-v2-tf-0001.bin
-framework: dldt
-license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/resnet-50-int8-tf-0001/description/resnet-50-int8-tf-0001.md b/models/intel/resnet-50-int8-tf-0001/description/resnet-50-int8-tf-0001.md
deleted file mode 100644
index f697af59293..00000000000
--- a/models/intel/resnet-50-int8-tf-0001/description/resnet-50-int8-tf-0001.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# resnet-50-int8-tf-0001
-
-## Use Case and High-Level Description
-
-This is the Resnet-50 v1 model that is designed to perform image classification. The model has been pretrained on the ImageNet image database and then quantized to INT8 fixed-point precision using so-called Quantization-aware training approach implemented in TensorFlow framework. For details about the original floating point model, check out the [paper](https://arxiv.org/pdf/1512.03385.pdf).
-
-The model input is a blob that consists of a single image of "1x224x224x3" in BGR order.
-
-The model output for `resnet-50-int8-tf-0001` is the usual object classifier output for the 1000 different classifications matching those in the ImageNet database.
-
-## Example
-
-## Specification
-
-| Metric            | Value         |
-|-------------------|---------------|
-| Type              | Classification|
-| GFLOPs            | 6.996         |
-| MParams           | 25.530        |
-| Source framework  | TensorFlow    |
-
-## Accuracy
-
-The quality metrics calculated on ImageNet validation dataset is 74.6% accuracy top-1.
-
-| Metric                    | Value         |
-|---------------------------|---------------|
-| Accuracy top-1 (ImageNet) |         74.6% |
-
-## Performance
-
-## Input
-
-Image, shape - `1,224,224,3`, format is `B,H,W,C` where:
-
-- `B` - batch size
-- `H` - height
-- `W` - width
-- `C` - channel
-
-Channel order is `BGR`
-
-## Output
-
-Object classifier according to ImageNet classes, shape -`1,1000`, output data format is `B,C` where:
-
-- `B` - batch size
-- `C` - predicted probabilities for each class in  [0, 1] range
-
diff --git a/models/intel/resnet-50-int8-tf-0001/model.yml b/models/intel/resnet-50-int8-tf-0001/model.yml
deleted file mode 100644
index 9feb23f5af2..00000000000
--- a/models/intel/resnet-50-int8-tf-0001/model.yml
+++ /dev/null
@@ -1,47 +0,0 @@
-# Copyright (c) 2019 Intel Corporation
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-description: >-
-  This is the Resnet-50 v1 model that is designed to perform image classification.
-  The model has been pretrained on the ImageNet image database and then quantized
-  to INT8 fixed-point precision using so-called Quantization-aware training approach
-  implemented in TensorFlow framework. For details about the original floating
-  point model, check out the [paper](https://arxiv.org/pdf/1512.03385.pdf).
-
-  The model input is a blob that consists of a single image of "1x224x224x3"
-  in BGR order.
-
-  The model output for `resnet-50-int8-tf-0001` is the usual object classifier
-  output for the 1000 different classifications matching those in the ImageNet
-  database.
-task_type: classification
-files:
-  - name: FP32/resnet-50-int8-tf-0001.xml
-    size: 1449034
-    sha256: 6832a01f08734ec738ec578ffd3ed8c0be1a5000b02a6c51aa60824a7943cd47
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet-50-int8-tf-0001/FP32/resnet-50-int8-tf-0001.xml
-  - name: FP32/resnet-50-int8-tf-0001.bin
-    size: 102121960
-    sha256: bc907b55caf9cc5dc045785105d99b56ac57ea5cf58f5fd89032f4aca33d6060
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet-50-int8-tf-0001/FP32/resnet-50-int8-tf-0001.bin
-  - name: FP16/resnet-50-int8-tf-0001.xml
-    size: 1448974
-    sha256: afa97920b779fc8c2723120327238e16692bb33e39a4b8f6bafa8ca5c502e3e4
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet-50-int8-tf-0001/FP16/resnet-50-int8-tf-0001.xml
-  - name: FP16/resnet-50-int8-tf-0001.bin
-    size: 51061004
-    sha256: 155775217a5571bcef095dc2337154467ddafb161af2351b7b18bc445d9ffd86
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet-50-int8-tf-0001/FP16/resnet-50-int8-tf-0001.bin
-framework: dldt
-license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/resnet18-xnor-binary-onnx-0001/description/resnet18-xnor-binary-onnx-0001.md b/models/intel/resnet18-xnor-binary-onnx-0001/description/resnet18-xnor-binary-onnx-0001.md
new file mode 100644
index 00000000000..fae03f745d6
--- /dev/null
+++ b/models/intel/resnet18-xnor-binary-onnx-0001/description/resnet18-xnor-binary-onnx-0001.md
@@ -0,0 +1,42 @@
+# resnet18-xnor-binary-onnx-0001
+
+## Use Case and High-Level Description
+
+This is a classical classification network for 1000 classes trained on ImageNet.
+The difference is that most convolutional layers were replaced by binary ones that can be implemented as XNOR+POPCOUNT operations.
+Only the input, final, and shortcut layers were kept as FP32; all the remaining convolutional layers were replaced by binary convolution layers.
+
+
+## Specification
+| Metric          | Value    |
+|-----------------|----------|
+| Image size      | 224x224  |
+| Source framework  | PyTorch\*             |
+
+## Accuracy
+
+The quality metric calculated on the ImageNet validation dataset is 61.71% top-1 accuracy.
+
+| Metric                    | Value         |
+|---------------------------|---------------|
+| Accuracy top-1 (ImageNet) |        61.71% |
+
+## Performance
+
+## Inputs
+
+A blob with a BGR image in the format: [B, C=3, H=224, W=224], where:
+
+- B – batch size
+- C – number of channels
+- H – image height
+- W – image width
+
+The input is expected to be a BGR image with values in the 0..255 range.
+
+## Outputs
+
+The output is a blob with the shape [B, C=1000].
+
+## Legal Information
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/resnet18-xnor-binary-onnx-0001/model.yml b/models/intel/resnet18-xnor-binary-onnx-0001/model.yml
new file mode 100644
index 00000000000..f88752b8d38
--- /dev/null
+++ b/models/intel/resnet18-xnor-binary-onnx-0001/model.yml
@@ -0,0 +1,36 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  ResNet-18 Binary with XNOR weight binarization
+task_type: classification
+files:
+  - name: FP32-INT1/resnet18-xnor-binary-onnx-0001.xml
+    size: 93590
+    sha256: 219cdef5a3cfb82ecc895983a9840def9145b717e6ce54327cfff47ca076e8e7
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/resnet18-xnor-binary-onnx-0001/FP32-INT1/resnet18-xnor-binary-onnx-0001.xml
+  - name: FP32-INT1/resnet18-xnor-binary-onnx-0001.bin
+    size: 4190944
+    sha256: 69f0fef2a4373fb4a72a9fe99442f14e8d367470422f9068976284114193e833
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/resnet18-xnor-binary-onnx-0001/FP32-INT1/resnet18-xnor-binary-onnx-0001.bin
+  - name: FP16-INT1/resnet18-xnor-binary-onnx-0001.xml
+    size: 93564
+    sha256: 6b9226d527779f3528cafe97ce81350e0570b21e0c9c018faaed15e47bde8389
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/resnet18-xnor-binary-onnx-0001/FP16-INT1/resnet18-xnor-binary-onnx-0001.xml
+  - name: FP16-INT1/resnet18-xnor-binary-onnx-0001.bin
+    size: 2782080
+    sha256: 57a2767a0dd7eddb59830b93a01ce5f6ef0906abb252602f89f7dd28071a6dd5
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/resnet18-xnor-binary-onnx-0001/FP16-INT1/resnet18-xnor-binary-onnx-0001.bin
+framework: dldt
+license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/resnet50-binary-0001/model.yml b/models/intel/resnet50-binary-0001/model.yml
index 40dbfe9ecd2..a8a970d9131 100644
--- a/models/intel/resnet50-binary-0001/model.yml
+++ b/models/intel/resnet50-binary-0001/model.yml
@@ -13,20 +13,24 @@
 # limitations under the License.
 
 description: >-
-  This is a classical classification network for 1000 classes trained on ImageNet.
-  The difference is that most convolutional layers were replaced by binary once
-  that can be implemented as XNOR+POPCOUN operations. Only input, final and shortcut
-  layers were kept as FP32, all the rest convolutional layers are replaced by
-  BinaryConvolution layers.
+  ResNet-50 Binary
 task_type: classification
 files:
-  - name: INT1/resnet50-binary-0001.xml
-    size: 169246
-    sha256: 1a7e41ab273f9e7b064e60e889ba2f13ce1b07cb4610096bd3abef33a93bf992
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet50-binary-0001/INT1/resnet50-binary-0001.xml
-  - name: INT1/resnet50-binary-0001.bin
-    size: 22112960
-    sha256: e843a458ae786f860698919709fb0852ef8138d4461ce8c744f96fe29ef0d580
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/resnet50-binary-0001/INT1/resnet50-binary-0001.bin
+  - name: FP32-INT1/resnet50-binary-0001.xml
+    size: 227764
+    sha256: 011296b3a0ef3311597f7425339a8b3d1aad6c9b3f5f4fd58c2a467a24271296
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/resnet50-binary-0001/FP32-INT1/resnet50-binary-0001.xml
+  - name: FP32-INT1/resnet50-binary-0001.bin
+    size: 22112976
+    sha256: 35c724a526d54d32badf20a5bf929925d333a4e67bcf493c854ce4d5a3e258cb
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/resnet50-binary-0001/FP32-INT1/resnet50-binary-0001.bin
+  - name: FP16-INT1/resnet50-binary-0001.xml
+    size: 227670
+    sha256: 4329f94b2c23852cfd946e75dd38c161a88d99590de99906d5648e03f259ea2d
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/resnet50-binary-0001/FP16-INT1/resnet50-binary-0001.xml
+  - name: FP16-INT1/resnet50-binary-0001.bin
+    size: 12348784
+    sha256: cb98ba6a96cc46d1eae9786e964b1fad2b41d74470c2032a1961fb66ece91332
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/resnet50-binary-0001/FP16-INT1/resnet50-binary-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/road-segmentation-adas-0001/model.yml b/models/intel/road-segmentation-adas-0001/model.yml
index 6d176777de3..f6db78dc4de 100644
--- a/models/intel/road-segmentation-adas-0001/model.yml
+++ b/models/intel/road-segmentation-adas-0001/model.yml
@@ -13,25 +13,33 @@
 # limitations under the License.
 
 description: >-
-  This is a segmentation network to classify each pixel into four classes: BG,
-  road, curb, mark.
+  Multiclass (BG, road, curbs, marks) segmentation based on ENET, using depthwise
+  convolutions and without ELU operations and without concatenation
 task_type: semantic_segmentation
 files:
   - name: FP32/road-segmentation-adas-0001.xml
-    size: 172322
-    sha256: 59de171ea5117d88fca37252bf614b15acb20424c7db09803f364a0a65a27309
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/road-segmentation-adas-0001/FP32/road-segmentation-adas-0001.xml
+    size: 357682
+    sha256: 7c1fabbec883c4297e7b82037afd8262c8f1afba3bb23863bbcc6177fce91706
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/road-segmentation-adas-0001/FP32/road-segmentation-adas-0001.xml
   - name: FP32/road-segmentation-adas-0001.bin
-    size: 737136
-    sha256: e4ec8fa66deb6904b5b6faa109fa699098cc1f947bf5216c6e31595ec397c569
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/road-segmentation-adas-0001/FP32/road-segmentation-adas-0001.bin
+    size: 737200
+    sha256: ae43e7d5dd1ad62cbe62a2d8aa5dd3721b7581f26763ba3c69660da2a91c3d87
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/road-segmentation-adas-0001/FP32/road-segmentation-adas-0001.bin
   - name: FP16/road-segmentation-adas-0001.xml
-    size: 172167
-    sha256: 2bbe4bdc357880b73d6f7968e85870fbae4f004196c87d5836f27f4c20e3db31
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/road-segmentation-adas-0001/FP16/road-segmentation-adas-0001.xml
+    size: 357527
+    sha256: 0e90b547c84bdac869f5d9e227fc2df9da64f4de787886ac4d5c0d89b73344d7
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/road-segmentation-adas-0001/FP16/road-segmentation-adas-0001.xml
   - name: FP16/road-segmentation-adas-0001.bin
-    size: 368568
-    sha256: 292b8c8789d66f102ffb9b87104b39488bfa55293ef97e7d6a50439762cdd884
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/road-segmentation-adas-0001/FP16/road-segmentation-adas-0001.bin
+    size: 368632
+    sha256: ddbc38aaee27ed8166d1190519380a91cdea8cf7f4bc71585d939fd6ead6b159
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/road-segmentation-adas-0001/FP16/road-segmentation-adas-0001.bin
+  - name: FP32-INT8/road-segmentation-adas-0001.xml
+    size: 1057411
+    sha256: 44d6a4fac2f88498c465ebe83d2a2189e16e12f389f7fc4c33a564cc99836a0c
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/road-segmentation-adas-0001/FP32-INT8/road-segmentation-adas-0001.xml
+  - name: FP32-INT8/road-segmentation-adas-0001.bin
+    size: 783048
+    sha256: 6c6cb1de3831c294f79cc6d693edb5d36874608dd4bfd45b2ee88dc6df390b98
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/road-segmentation-adas-0001/FP32-INT8/road-segmentation-adas-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/semantic-segmentation-adas-0001/model.yml b/models/intel/semantic-segmentation-adas-0001/model.yml
index f12e299ecea..d1602603eb9 100644
--- a/models/intel/semantic-segmentation-adas-0001/model.yml
+++ b/models/intel/semantic-segmentation-adas-0001/model.yml
@@ -13,64 +13,34 @@
 # limitations under the License.
 
 description: >-
-  This is a segmentation network to classify each pixel into 20 classes:
-
-  - road
-
-  - sidewalk
-
-  - building
-
-  - wall
-
-  - fence
-
-  - pole
-
-  - traffic light
-
-  - traffic sign
-
-  - vegetation
-
-  - terrain
-
-  - sky
-
-  - person
-
-  - rider
-
-  - car
-
-  - truck
-
-  - bus
-
-  - train
-
-  - motorcycle
-
-  - bicycle
-
-  - ego-vehicle
+  Multiclass (road, sidewalk, building, wall, fence, pole, traffic light,
+  traffic sign, vegetation, terrain, sky, person, rider, car, truck,
+  bus, train, motorcycle, bicycle, ego-vehicle) segmentation based on ICNet
 task_type: semantic_segmentation
 files:
   - name: FP32/semantic-segmentation-adas-0001.xml
-    size: 90871
-    sha256: 1b39f23ab44725db2da4641a6500bfd913017a1b9f4ae919abd25bde75ae937f
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/semantic-segmentation-adas-0001/FP32/semantic-segmentation-adas-0001.xml
+    size: 182087
+    sha256: c3fc63223316e68dc35d147661906a23e83a0655f72a6ca5dabc3251e98d9566
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/semantic-segmentation-adas-0001/FP32/semantic-segmentation-adas-0001.xml
   - name: FP32/semantic-segmentation-adas-0001.bin
-    size: 26743560
-    sha256: 5a616b105fa42f574e4d23cfc227c10b8bdcc0ba0e66864d7aa4b8a269b7cc76
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/semantic-segmentation-adas-0001/FP32/semantic-segmentation-adas-0001.bin
+    size: 26743564
+    sha256: 6d2592c07c91ed1de76c683a2c5753c89f0a61c215bc553f2a6b30faa05b37ba
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/semantic-segmentation-adas-0001/FP32/semantic-segmentation-adas-0001.bin
   - name: FP16/semantic-segmentation-adas-0001.xml
-    size: 90790
-    sha256: 5ef7a87d2ca428b95811023964a49ed3f90dc1905e79c9701b4d43e607ebcc1c
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/semantic-segmentation-adas-0001/FP16/semantic-segmentation-adas-0001.xml
+    size: 182006
+    sha256: b446ba0eb6b0da3888b6052263f1c951abc5737966a8ed067f9cb912bce8d251
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/semantic-segmentation-adas-0001/FP16/semantic-segmentation-adas-0001.xml
   - name: FP16/semantic-segmentation-adas-0001.bin
-    size: 13371780
-    sha256: 8c39dcb0d3569003264165eda163833eef2d0803121147ab06f46697e4f8b4c4
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/semantic-segmentation-adas-0001/FP16/semantic-segmentation-adas-0001.bin
+    size: 13371824
+    sha256: a6366b6cd8e6456bdea4d2709e4d062c434a94cfabb62905dfbb4cd50b3df5d5
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/semantic-segmentation-adas-0001/FP16/semantic-segmentation-adas-0001.bin
+  - name: FP32-INT8/semantic-segmentation-adas-0001.xml
+    size: 506262
+    sha256: feba4beb19e206bfa06017c13bc8eac4001a5863043ee2d87316039958323c85
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/semantic-segmentation-adas-0001/FP32-INT8/semantic-segmentation-adas-0001.xml
+  - name: FP32-INT8/semantic-segmentation-adas-0001.bin
+    size: 26858920
+    sha256: 6a2362f6c06fe1d569699d82f461245e7233e4cbc99f729baba3acec3bf5207b
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/semantic-segmentation-adas-0001/FP32-INT8/semantic-segmentation-adas-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/single-image-super-resolution-1032/description/single-image-super-resolution-1032.md b/models/intel/single-image-super-resolution-1032/description/single-image-super-resolution-1032.md
index 9ff205f613a..884bc166ca2 100644
--- a/models/intel/single-image-super-resolution-1032/description/single-image-super-resolution-1032.md
+++ b/models/intel/single-image-super-resolution-1032/description/single-image-super-resolution-1032.md
@@ -26,7 +26,7 @@ Super resolution:
 | PSNR                            | 29.29 dB                                  |
 | GFlops                          | 11.654                                    |
 | MParams                         | 0.030                                     |
-| Source framework                | Pytorch*                                  |
+| Source framework                | PyTorch*                                  |
 
 For reference, PSNR for bicubic upsampling on test dataset is 26.79 dB.
 
diff --git a/models/intel/single-image-super-resolution-1032/model.yml b/models/intel/single-image-super-resolution-1032/model.yml
index c7cab2adcc7..59a874eea63 100644
--- a/models/intel/single-image-super-resolution-1032/model.yml
+++ b/models/intel/single-image-super-resolution-1032/model.yml
@@ -13,34 +13,32 @@
 # limitations under the License.
 
 description: >-
-  An Attention-Based Approach for Single Image Super Resolution <https://arxiv.org/pdf/1807.06779.pdf>
-  but with reduced number of channels and changes in network achitecture. It enhances
-  the resolution of the input image by a factor of 4.
+  Super resolution model
 task_type: image_processing
 files:
   - name: FP32/single-image-super-resolution-1032.xml
-    size: 26530
-    sha256: b822073958fa1098054dca13a6f4a63de182179a037cdb6ad46fd6bcafad4728
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/single-image-super-resolution-1032/FP32/single-image-super-resolution-1032.xml
+    size: 41194
+    sha256: 5e68e407a9abd030ecb62d5f1e96f8b76c0fb81ec52fc8be2078886868d480fa
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/single-image-super-resolution-1032/FP32/single-image-super-resolution-1032.xml
   - name: FP32/single-image-super-resolution-1032.bin
-    size: 119424
-    sha256: e2403b56bd57b0e7c68e33dad3fb1af5e3f0be4a3ad7c7cbc1836fddf0c062b0
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/single-image-super-resolution-1032/FP32/single-image-super-resolution-1032.bin
+    size: 119556
+    sha256: 82b5338155835d6b4307721e6a9b28775a4550b61c31d76aac1a8b5d5612d7dc
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/single-image-super-resolution-1032/FP32/single-image-super-resolution-1032.bin
   - name: FP16/single-image-super-resolution-1032.xml
-    size: 26507
-    sha256: ea929389e3196053d3066323ee69d03d5c766521868d162f0aa01ddcbfdc90c2
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/single-image-super-resolution-1032/FP16/single-image-super-resolution-1032.xml
+    size: 41171
+    sha256: 2a420d86b919aeb7eafb752b09b230b390044f35b6ba9709117594fe310f1ab7
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/single-image-super-resolution-1032/FP16/single-image-super-resolution-1032.xml
   - name: FP16/single-image-super-resolution-1032.bin
-    size: 59752
-    sha256: ac8a8c9387098ae9bc0cbda82cfe3235c9d2f9652277bbf07d78b96d2c4ff7e9
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/single-image-super-resolution-1032/FP16/single-image-super-resolution-1032.bin
-  - name: INT8/single-image-super-resolution-1032.xml
-    size: 40591
-    sha256: 6e0ad9d25a9f1d31733edec7c220c3ff5d2a3e0c02c1793313067b5cb4692a56
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/single-image-super-resolution-1032/INT8/single-image-super-resolution-1032.xml
-  - name: INT8/single-image-super-resolution-1032.bin
-    size: 119424
-    sha256: 89f809550199ccc33f65e54377ae88098fceacdb5f71800fe04ab2c9439e1818
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/single-image-super-resolution-1032/INT8/single-image-super-resolution-1032.bin
+    size: 59882
+    sha256: abae5907d40ef7e47d680435a99484b74076a985a6b8c3353b64fa77e6d3c149
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/single-image-super-resolution-1032/FP16/single-image-super-resolution-1032.bin
+  - name: FP32-INT8/single-image-super-resolution-1032.xml
+    size: 122462
+    sha256: f6aa087d5c7c43ddf7a0a4f63fc5f6c747ef7ecdd9fa6a7c953de063a5599547
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/single-image-super-resolution-1032/FP32-INT8/single-image-super-resolution-1032.xml
+  - name: FP32-INT8/single-image-super-resolution-1032.bin
+    size: 121724
+    sha256: e14739375434b1645d0b6745947aae73fd9b915750b033ce08f25aab93b0b25e
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/single-image-super-resolution-1032/FP32-INT8/single-image-super-resolution-1032.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/single-image-super-resolution-1033/description/single-image-super-resolution-1033.md b/models/intel/single-image-super-resolution-1033/description/single-image-super-resolution-1033.md
index 78867284350..92878b1ae1b 100644
--- a/models/intel/single-image-super-resolution-1033/description/single-image-super-resolution-1033.md
+++ b/models/intel/single-image-super-resolution-1033/description/single-image-super-resolution-1033.md
@@ -26,7 +26,7 @@ Super resolution:
 | PSNR                            | 30.97 dB                                  |
 | GFlops                          | 16.062                                    |
 | MParams                         | 0.030                                     |
-| Source framework                | Pytorch*                                  |
+| Source framework                | PyTorch*                                  |
 
 For reference, PSNR for bicubic upsampling on test dataset is 28.48 dB.
 
diff --git a/models/intel/single-image-super-resolution-1033/model.yml b/models/intel/single-image-super-resolution-1033/model.yml
index fec4807bada..b1b4a9b3ae6 100644
--- a/models/intel/single-image-super-resolution-1033/model.yml
+++ b/models/intel/single-image-super-resolution-1033/model.yml
@@ -13,34 +13,32 @@
 # limitations under the License.
 
 description: >-
-  An Attention-Based Approach for Single Image Super Resolution <https://arxiv.org/pdf/1807.06779.pdf>
-  but with reduced number of channels and changes in network achitecture. It enhances
-  the resolution of the input image by a factor of 3.
+  Super resolution model
 task_type: image_processing
 files:
   - name: FP32/single-image-super-resolution-1033.xml
-    size: 23463
-    sha256: 7c5526e47a0299af889d206b5a64e96fbdccbd980701d16cc6886aa545173d3b
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/single-image-super-resolution-1033/FP32/single-image-super-resolution-1033.xml
+    size: 36334
+    sha256: 1d51ca5a62c9b35532414cffd9c7b6dd874d1dfa8e728079161f748e9729ca0e
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/single-image-super-resolution-1033/FP32/single-image-super-resolution-1033.xml
   - name: FP32/single-image-super-resolution-1033.bin
-    size: 121720
-    sha256: 4f788a5d05373a8e68a20df7bde17347dbaf1531db0ed7ca340977c0dcb18b7a
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/single-image-super-resolution-1033/FP32/single-image-super-resolution-1033.bin
+    size: 121812
+    sha256: 47b0c1d3b28c1193fdb7838cebdad29e010abfdc7664ef06257bd659f4f08474
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/single-image-super-resolution-1033/FP32/single-image-super-resolution-1033.bin
   - name: FP16/single-image-super-resolution-1033.xml
-    size: 23449
-    sha256: 8a2b2833ed71fbf2d6661bad264b61500169dabcc852f3181c8d87900f077865
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/single-image-super-resolution-1033/FP16/single-image-super-resolution-1033.xml
+    size: 36318
+    sha256: ede3cf9c574810450aeb6f14dfe7ddfbdfe5d1e47e277d7c5aea7987ca0bb802
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/single-image-super-resolution-1033/FP16/single-image-super-resolution-1033.xml
   - name: FP16/single-image-super-resolution-1033.bin
-    size: 60880
-    sha256: 0c0bd11d77f6a23242592db1c6ae0a3f0c8b472952aa3c2f5449cc448f68d90f
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/single-image-super-resolution-1033/FP16/single-image-super-resolution-1033.bin
-  - name: INT8/single-image-super-resolution-1033.xml
-    size: 36987
-    sha256: 68b7200b8d656473297f7febf9443965a260852061a724d4d7589a23bc93410a
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/single-image-super-resolution-1033/INT8/single-image-super-resolution-1033.xml
-  - name: INT8/single-image-super-resolution-1033.bin
-    size: 121720
-    sha256: 02e947ddd1aa362f1a48cda45aa716637b32b0d19dae88b5bbe15bff0a4a2276
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/single-image-super-resolution-1033/INT8/single-image-super-resolution-1033.bin
+    size: 60970
+    sha256: 771dd5b865006aea3a04a6b5e858c34fe619913d8aa1279cd9b6a40c05ef0df7
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/single-image-super-resolution-1033/FP16/single-image-super-resolution-1033.bin
+  - name: FP32-INT8/single-image-super-resolution-1033.xml
+    size: 113556
+    sha256: 8e1b65fd3cdcc6d016b1495e7f73f5f353446df71151619800dc5950b2c23ad8
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/single-image-super-resolution-1033/FP32-INT8/single-image-super-resolution-1033.xml
+  - name: FP32-INT8/single-image-super-resolution-1033.bin
+    size: 124040
+    sha256: d066c186597ae2d74f42250945a8f0c315f284e4d1fd7126c263228cc94e8c13
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/single-image-super-resolution-1033/FP32-INT8/single-image-super-resolution-1033.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/text-detection-0003/model.yml b/models/intel/text-detection-0003/model.yml
index 7ab786695f2..7bcb16038cf 100644
--- a/models/intel/text-detection-0003/model.yml
+++ b/models/intel/text-detection-0003/model.yml
@@ -13,34 +13,32 @@
 # limitations under the License.
 
 description: >-
-  Text detector based on PixelLink <https://arxiv.org/pdf/1801.01315.pdf> architecture
-  with MobileNetV2-like <https://arxiv.org/pdf/1801.04381.pdf> as a backbone
-  for indoor/outdoor scenes.
+  Detects oriented text.
 task_type: detection
 files:
   - name: FP32/text-detection-0003.xml
-    size: 83483
-    sha256: c57f9e037e7bed7219ddf275a1773106b0101f6567df7b79e42e838798a384d9
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-detection-0003/FP32/text-detection-0003.xml
+    size: 178394
+    sha256: e63aae42d6d37fd4aab0bbf553554af20556aea218ad0465f2bfd721c5cba25d
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-detection-0003/FP32/text-detection-0003.xml
   - name: FP32/text-detection-0003.bin
-    size: 26986232
-    sha256: 4ce684ad28cb70dc464565e1a476718845e3cc190fca14f385117f9ad970bcc4
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-detection-0003/FP32/text-detection-0003.bin
+    size: 26986280
+    sha256: 03430c799fa873e859eb0018318e741fd58b8ff6b9891949cb931876db3bf0e1
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-detection-0003/FP32/text-detection-0003.bin
   - name: FP16/text-detection-0003.xml
-    size: 83403
-    sha256: b59554dd0e5f789fc5cacdbe7e5472ee977e368a6ca2a7023e99168c8f0bae97
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-detection-0003/FP16/text-detection-0003.xml
+    size: 178314
+    sha256: a24e90b48c701a6cce64ad279c8b00500deb308292f05852b732112474dba5e9
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-detection-0003/FP16/text-detection-0003.xml
   - name: FP16/text-detection-0003.bin
-    size: 13493008
-    sha256: 0ee50f6aad475bf34116f809278766e0ecc82a648bbde40e2070c2e36f62ace7
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-detection-0003/FP16/text-detection-0003.bin
-  - name: INT8/text-detection-0003.xml
-    size: 939308
-    sha256: 1b54398122719ead6bb98f9ac8d0d9cf73eac7787c547c08e485711dcdd76e0e
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-detection-0003/INT8/text-detection-0003.xml
-  - name: INT8/text-detection-0003.bin
-    size: 26986232
-    sha256: 5685f059522ae30cdbdef60317882988415fccc0e33950ed224b4d81d8e1a27c
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-detection-0003/INT8/text-detection-0003.bin
+    size: 13493056
+    sha256: 84fc3ce490259047e3a48f2810f4cd2a38ad20c12a82f96e39f4ccb78b86b1f7
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-detection-0003/FP16/text-detection-0003.bin
+  - name: FP32-INT8/text-detection-0003.xml
+    size: 557004
+    sha256: cec8d7e41ed77e4b2b23b5119dc2f390781de266ef193ea9fb357d1c690d138b
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-detection-0003/FP32-INT8/text-detection-0003.xml
+  - name: FP32-INT8/text-detection-0003.bin
+    size: 27219792
+    sha256: 5eeffd8c051eba2661f87e43d08721576e0a346af569694a6859b748916233e1
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-detection-0003/FP32-INT8/text-detection-0003.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/text-detection-0004/model.yml b/models/intel/text-detection-0004/model.yml
index 50ad56b473e..08aee25979b 100644
--- a/models/intel/text-detection-0004/model.yml
+++ b/models/intel/text-detection-0004/model.yml
@@ -13,26 +13,32 @@
 # limitations under the License.
 
 description: >-
-  Text detector based on PixelLink <https://arxiv.org/pdf/1801.01315.pdf> architecture
-  with MobileNetV2, depth_multiplier=1.4 <(https://arxiv.org/pdf/1801.04381.pdf>
-  as a backbone for indoor/outdoor scenes.
+  Detects oriented text.
 task_type: detection
 files:
   - name: FP32/text-detection-0004.xml
-    size: 71958
-    sha256: 216e8c1124ef2bfe42c59db24c31402843f121d57a183b8c8e3c4e0dddb992ba
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-detection-0004/FP32/text-detection-0004.xml
+    size: 156938
+    sha256: 244f836e36d63c9bd45b2123f4b9e4672cae6be348c15cac857d75a8b9852dd7
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-detection-0004/FP32/text-detection-0004.xml
   - name: FP32/text-detection-0004.bin
-    size: 17312120
-    sha256: f6b58bf15c43cc017bd5f979b46b3159969968e47d3827de866d76d537931e1a
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-detection-0004/FP32/text-detection-0004.bin
+    size: 17312168
+    sha256: 6da6456f27123be2d9a0e68bb73a7750f6aaee2f0af75d7f34ec6fa97f6727dc
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-detection-0004/FP32/text-detection-0004.bin
   - name: FP16/text-detection-0004.xml
-    size: 71863
-    sha256: 049402345031d086583621e59f3ed5b913823589158c35f1115fb1cbb6bfdbcd
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-detection-0004/FP16/text-detection-0004.xml
+    size: 156841
+    sha256: a348b2b3adac52b92f15c21605f55fa75bf930ac1827871965c7eb9f71ad4a24
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-detection-0004/FP16/text-detection-0004.xml
   - name: FP16/text-detection-0004.bin
-    size: 8655952
-    sha256: 25b12925d0695af246ae68fbdf2ca1b61ac5b1f6b4b368386c2d82c880c93b70
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-detection-0004/FP16/text-detection-0004.bin
+    size: 8656000
+    sha256: 719639a52b46f94455ad8c2fb6d0e0bb98c485179f4321c558d5d88aacfbfd0e
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-detection-0004/FP16/text-detection-0004.bin
+  - name: FP32-INT8/text-detection-0004.xml
+    size: 461347
+    sha256: 025f0b274e560189ba8a054dbbdef6ec09f0a697b5e79955472a5b142707ad0e
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-detection-0004/FP32-INT8/text-detection-0004.xml
+  - name: FP32-INT8/text-detection-0004.bin
+    size: 17559056
+    sha256: fa2e973387c7b8a1e8d3165dae15e72e0537ef8e55eeae98081b0fb2b88676c6
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-detection-0004/FP32-INT8/text-detection-0004.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/text-image-super-resolution-0001/description/text-image-super-resolution-0001.md b/models/intel/text-image-super-resolution-0001/description/text-image-super-resolution-0001.md
index 85b5a308e0f..1a17850602f 100644
--- a/models/intel/text-image-super-resolution-0001/description/text-image-super-resolution-0001.md
+++ b/models/intel/text-image-super-resolution-0001/description/text-image-super-resolution-0001.md
@@ -35,7 +35,7 @@ support the `reshape` function.
 
 ## Inputs
 
-1. name: `0`, shape: [1x3x768x1280] - An input image in the format [BxCxHxW],
+1. name: `0`, shape: [1x1x360x640] - An input image in the format [BxCxHxW],
    where:
     - B - batch size
     - C - number of channels
diff --git a/models/intel/text-image-super-resolution-0001/model.yml b/models/intel/text-image-super-resolution-0001/model.yml
index 7eb17b37b8a..674e31e67ba 100644
--- a/models/intel/text-image-super-resolution-0001/model.yml
+++ b/models/intel/text-image-super-resolution-0001/model.yml
@@ -13,34 +13,32 @@
 # limitations under the License.
 
 description: >-
-  The tiny model to upscale scanned images with text. The model used `ConvTranspose2d`
-  layer instead of `PixelShuffle` as result the model can be launched on GPU and MYRIAD
-  devices and support `reshape` function.
+  Super resolution model
 task_type: image_processing
 files:
   - name: FP32/text-image-super-resolution-0001.xml
-    size: 5696
-    sha256: 7f5882d4e9c12d6a34ee79987489b0a72beaa192a613cdf4f7f73c89425a1c49
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-image-super-resolution-0001/FP32/text-image-super-resolution-0001.xml
+    size: 11358
+    sha256: 2587a0ad10ea3fc04fb44d680d79662af6a2c9613c9c0e0c3107be9b1a96e18c
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-image-super-resolution-0001/FP32/text-image-super-resolution-0001.xml
   - name: FP32/text-image-super-resolution-0001.bin
     size: 10836
     sha256: 033d58430a2744302a2729291d66d4c74ee6bce517b6ae36f1b5a0e8b27d82ff
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-image-super-resolution-0001/FP32/text-image-super-resolution-0001.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-image-super-resolution-0001/FP32/text-image-super-resolution-0001.bin
   - name: FP16/text-image-super-resolution-0001.xml
-    size: 5686
-    sha256: 030c87cc1269536882fe26cc822382223e5da46de98d077b2a711a3c0788ad66
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-image-super-resolution-0001/FP16/text-image-super-resolution-0001.xml
+    size: 11348
+    sha256: 3b99523e38d4a178448b7801d9483232bf9168ab183c681c8649d1f02ebc3920
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-image-super-resolution-0001/FP16/text-image-super-resolution-0001.xml
   - name: FP16/text-image-super-resolution-0001.bin
     size: 5418
     sha256: f203818d73b933e5004aff85aeb84783dbf0be9e5c296d2995fc0678ff719e9c
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-image-super-resolution-0001/FP16/text-image-super-resolution-0001.bin
-  - name: INT8/text-image-super-resolution-0001.xml
-    size: 5268
-    sha256: 6aec2e36d6e891ea4098a4a401bc048e770a43bfc169a6f80406d95eeeabbf67
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-image-super-resolution-0001/INT8/text-image-super-resolution-0001.xml
-  - name: INT8/text-image-super-resolution-0001.bin
-    size: 10836
-    sha256: 496b4c29fb9333fa0ced6ae3d60899b486b67dba9bf37d28b83c8acd03c2b004
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-image-super-resolution-0001/INT8/text-image-super-resolution-0001.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-image-super-resolution-0001/FP16/text-image-super-resolution-0001.bin
+  - name: FP32-INT8/text-image-super-resolution-0001.xml
+    size: 27041
+    sha256: 1a1a41f0c325ca9befc70ba7e42170c5213a0474f755d3d56563b28f96b5ee19
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-image-super-resolution-0001/FP32-INT8/text-image-super-resolution-0001.xml
+  - name: FP32-INT8/text-image-super-resolution-0001.bin
+    size: 11228
+    sha256: f1680f577b003e5d6674d5b2d07277171487dac7707dbd18b686755e438127aa
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-image-super-resolution-0001/FP32-INT8/text-image-super-resolution-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/text-recognition-0012/model.yml b/models/intel/text-recognition-0012/model.yml
index 8d8478be27c..75d206bc74b 100644
--- a/models/intel/text-recognition-0012/model.yml
+++ b/models/intel/text-recognition-0012/model.yml
@@ -13,26 +13,33 @@
 # limitations under the License.
 
 description: >-
-  This is a network for text recognition scenario. It consists of VGG16-like backbone
-  and bidirectional LSTM encoder-decoder. The network is able to recognize case-insensitive
-  alpha-numeric text (36 unique symbols).
+  Recognizes alphanumeric text. Architecture: VGG-like + BiLSTM as an encoder -  BiLSTM
+  as a decoder.
 task_type: optical_character_recognition
 files:
   - name: FP32/text-recognition-0012.xml
-    size: 50415
-    sha256: e0f7979f11d7a7034ab60a66e83d6a48bb39a3f51987fd1aa942d90d11dd1f2d
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-recognition-0012/FP32/text-recognition-0012.xml
+    size: 97700
+    sha256: 54fd8ae6ea5ae11fdeb85f5c6b701793c28883f1e3dd8c3a531c43db6c3713ea
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-recognition-0012/FP32/text-recognition-0012.xml
   - name: FP32/text-recognition-0012.bin
-    size: 47470764
-    sha256: df7426c3a16c005eda3c9efc6afeefe38259b36748819fc0b28f3d2a67c16239
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-recognition-0012/FP32/text-recognition-0012.bin
+    size: 47470852
+    sha256: b0d99549692baeea3e83709a671844a365b15bd40e36d9a5d3ef5368a69d2897
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-recognition-0012/FP32/text-recognition-0012.bin
   - name: FP16/text-recognition-0012.xml
-    size: 50395
-    sha256: c272907c678f637b7eea5c6b5a72c07564864fca2224a78756c6add527c0df87
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-recognition-0012/FP16/text-recognition-0012.xml
+    size: 97668
+    sha256: dd971f01660f3395e51d7983f5b4d70ac99764efaa3db99a9c52cdac378ed2a0
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-recognition-0012/FP16/text-recognition-0012.xml
   - name: FP16/text-recognition-0012.bin
-    size: 23735394
-    sha256: 657f2b3fdcab897980f976692bb0b93bd05f7b29b111bfe518726ef5c835c786
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/text-recognition-0012/FP16/text-recognition-0012.bin
+    size: 23735478
+    sha256: 33294d251264f6913f0cc1f8a6463318becb5b70757984b461e5a865921b8d65
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-recognition-0012/FP16/text-recognition-0012.bin
+  - name: FP32-INT8/text-recognition-0012.xml
+    size: 131724
+    sha256: 668efb97ddb90a8c8c6796b3d7d06eee49d4c9bf03f26be99ace5a263681a61b
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-recognition-0012/FP32-INT8/text-recognition-0012.xml
+  - name: FP32-INT8/text-recognition-0012.bin
+    size: 47489632
+    sha256: 9df4967adc31b20314ac140b3927e98d7c212abe257eaa697955052b8e7a3674
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-recognition-0012/FP32-INT8/text-recognition-0012.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/text-spotting-0001-detector/description/text-spotting-0001-detector.md b/models/intel/text-spotting-0001-detector/description/text-spotting-0001-detector.md
new file mode 100644
index 00000000000..7ec7d1439aa
--- /dev/null
+++ b/models/intel/text-spotting-0001-detector/description/text-spotting-0001-detector.md
@@ -0,0 +1,53 @@
+# text-spotting-0001-detector
+
+## Use Case and High-Level Description
+
+This is a text spotting model that simultaneously detects and
+recognizes text. The model detects symbol sequences separated by space and performs
+recognition without a dictionary. The model is built on top of the Mask-RCNN
+framework with additional attention-based text recognition head.
+
+Symbols set is alphanumeric: `0123456789abcdefghijklmnopqrstuvwxyz`.
+
+This model is a Mask-RCNN-based text detector with ResNet50 backbone and additional text features output.
+
+## Example
+
+![](./text-spotting-0001.png)
+
+## Specification
+
+| Metric                                        | Value     |
+|-----------------------------------------------|-----------|
+| Word spotting hmean ICDAR2015, without a dictionary | 59.04%    |
+| Detection hmean ICDAR2015                     | 87.09%    |
+| GFlops                                        | 185.169   |
+| MParams                                       | 26.497    |
+| Source framework                              | PyTorch\* |
+
+*Hmean Word spotting* is defined and measured according to the
+[Incidental Scene Text (ICDAR2015) challenge](https://rrc.cvc.uab.es/?ch=4&com=introduction).
+
+## Performance
+
+## Inputs
+
+1.	Name: `im_data` , shape: [1x3x768x1280]. An input image in the [1xCxHxW] format. 
+    The expected channel order is BGR.
+2.	Name: `im_info`, shape: [1x3]. Image information: processed image height,
+    processed image width and processed image scale with respect to the original image resolution.
+
+## Outputs
+
+1.	Name: `classes`, shape: [100]. Contiguous integer class ID for every
+    detected object, `0` for background (no object detected).
+1.	Name: `scores`, shape: [100]. Detection confidence scores in the [0, 1] range 
+    for every object.
+1.	Name: `boxes`, shape: [100x4]. Bounding boxes around every detected object
+    in the (top_left_x, top_left_y, bottom_right_x, bottom_right_y) format.
+1.	Name: `raw_masks`, shape: [100x2x28x28]. Segmentation heatmaps for all
+    classes for every output bounding box.
+1.  Name: `text_features`, shape: [100x64x28x28]. Text features that are fed to a text recognition head.
+
+## Legal Information
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/text-spotting-0001-detector/description/text-spotting-0001.png b/models/intel/text-spotting-0001-detector/description/text-spotting-0001.png
new file mode 100644
index 00000000000..d80aa3adbeb
Binary files /dev/null and b/models/intel/text-spotting-0001-detector/description/text-spotting-0001.png differ
diff --git a/models/intel/text-spotting-0001-detector/model.yml b/models/intel/text-spotting-0001-detector/model.yml
new file mode 100644
index 00000000000..e416c4eda5b
--- /dev/null
+++ b/models/intel/text-spotting-0001-detector/model.yml
@@ -0,0 +1,36 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  Mask-RCNN-based text detector.
+task_type: detection
+files:
+  - name: FP32/text-spotting-0001-detector.xml
+    size: 275850
+    sha256: 850eeabbd8f371292fefc84132d37431efe4feb09fc1f437f05621b31cec344e
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-spotting-0001-detector/FP32/text-spotting-0001-detector.xml
+  - name: FP32/text-spotting-0001-detector.bin
+    size: 105906904
+    sha256: 3a4e3e7c3d0673a778882f5e6aaa217128473e79c5cb90c614d77ad25a108d42
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-spotting-0001-detector/FP32/text-spotting-0001-detector.bin
+  - name: FP16/text-spotting-0001-detector.xml
+    size: 275736
+    sha256: f36f7bff89dfc4c35b76107453c665ddb3837c7b5ac10755107fffc0e29acec6
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-spotting-0001-detector/FP16/text-spotting-0001-detector.xml
+  - name: FP16/text-spotting-0001-detector.bin
+    size: 52953494
+    sha256: 776648224b38f5023606b52f1782f4423b56ff588de8a7b7ea15c5e0fca15eb8
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-spotting-0001-detector/FP16/text-spotting-0001-detector.bin
+framework: dldt
+license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/text-spotting-0001-recognizer-decoder/description/text-spotting-0001-recognizer-decoder.md b/models/intel/text-spotting-0001-recognizer-decoder/description/text-spotting-0001-recognizer-decoder.md
new file mode 100644
index 00000000000..02971f77837
--- /dev/null
+++ b/models/intel/text-spotting-0001-recognizer-decoder/description/text-spotting-0001-recognizer-decoder.md
@@ -0,0 +1,46 @@
+# text-spotting-0001-recognizer-decoder
+
+## Use Case and High-Level Description
+
+This is a text spotting model that simultaneously detects and
+recognizes text. The model detects symbol sequences separated by space and performs
+recognition without a dictionary. The model is built on top of the Mask-RCNN
+framework with additional attention-based text recognition head.
+
+Symbols set is alphanumeric: `0123456789abcdefghijklmnopqrstuvwxyz`.
+
+This model is a 2D attention-based GRU decoder of the text recognition head.
+
+
+## Example
+
+![](./text-spotting-0001.png)
+
+## Specification
+
+| Metric                                        | Value     |
+|-----------------------------------------------|-----------|
+| Word spotting hmean ICDAR2015, without a dictionary | 59.04%    |
+| GFlops                                        | 0.002     |
+| MParams                                       | 0.273     |
+| Source framework                              | PyTorch\* |
+
+*Hmean Word spotting* is defined and measured according to the
+[Incidental Scene Text (ICDAR2015) challenge](https://rrc.cvc.uab.es/?ch=4&com=introduction).
+
+## Performance
+
+## Inputs
+
+1.	Name: `encoder_outputs` , shape: [1x256x64x64]. Encoded text recognition features.
+1.	Name: `prev_symbol` , shape: [1x1]. Index in alphabet of previously generated symbol.
+1.	Name: `prev_hidden`, shape: [1x1x256]. Previous hidden state of GRU.
+
+## Outputs
+
+1.	Name: `output`, shape: [1x256x64x64]. Encoded text recognition features.
+1.	Name: `hidden`, shape: [1x1x256]. Current hidden state of GRU.
+
+
+## Legal Information
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/text-spotting-0001-recognizer-decoder/description/text-spotting-0001.png b/models/intel/text-spotting-0001-recognizer-decoder/description/text-spotting-0001.png
new file mode 100644
index 00000000000..d80aa3adbeb
Binary files /dev/null and b/models/intel/text-spotting-0001-recognizer-decoder/description/text-spotting-0001.png differ
diff --git a/models/intel/text-spotting-0001-recognizer-decoder/model.yml b/models/intel/text-spotting-0001-recognizer-decoder/model.yml
new file mode 100644
index 00000000000..de20c098f19
--- /dev/null
+++ b/models/intel/text-spotting-0001-recognizer-decoder/model.yml
@@ -0,0 +1,37 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  Decoder part of text recognition head that takes encoder features from text-spotting-0001-recognizer-encoder
+  as input.
+task_type: optical_character_recognition
+files:
+  - name: FP32/text-spotting-0001-recognizer-decoder.xml
+    size: 30545
+    sha256: c161afda8cd45ee21934c74aec49321855651c3286921f5b6909da0e0bc0b626
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-spotting-0001-recognizer-decoder/FP32/text-spotting-0001-recognizer-decoder.xml
+  - name: FP32/text-spotting-0001-recognizer-decoder.bin
+    size: 2707804
+    sha256: 00cb0cef419a01661ca1c1b9977b1edebe581427dd28a593ba34505971544303
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-spotting-0001-recognizer-decoder/FP32/text-spotting-0001-recognizer-decoder.bin
+  - name: FP16/text-spotting-0001-recognizer-decoder.xml
+    size: 30529
+    sha256: f4eb268b589327d7bdc22ea7c084aa88cc36dd1eec9855ec9f17890b9b26154a
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-spotting-0001-recognizer-decoder/FP16/text-spotting-0001-recognizer-decoder.xml
+  - name: FP16/text-spotting-0001-recognizer-decoder.bin
+    size: 1354000
+    sha256: 58fb88820edf08b2809f2f7d7c563c86082b13342f01206ffc98707ed2a66948
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-spotting-0001-recognizer-decoder/FP16/text-spotting-0001-recognizer-decoder.bin
+framework: dldt
+license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/text-spotting-0001-recognizer-encoder/description/text-spotting-0001-recognizer-encoder.md b/models/intel/text-spotting-0001-recognizer-encoder/description/text-spotting-0001-recognizer-encoder.md
new file mode 100644
index 00000000000..953ce5ea68a
--- /dev/null
+++ b/models/intel/text-spotting-0001-recognizer-encoder/description/text-spotting-0001-recognizer-encoder.md
@@ -0,0 +1,42 @@
+# text-spotting-0001-recognizer-encoder
+
+## Use Case and High-Level Description
+
+This is a text spotting model that simultaneously detects and
+recognizes text. The model detects symbol sequences separated by space and performs
+recognition without a dictionary. The model is built on top of the Mask-RCNN
+framework with additional attention-based text recognition head.
+
+Symbols set is alphanumeric: `0123456789abcdefghijklmnopqrstuvwxyz`.
+
+This model is a fully-convolutional encoder of the text recognition head.
+
+## Example
+
+![](./text-spotting-0001.png)
+
+## Specification
+
+| Metric                                        | Value     |
+|-----------------------------------------------|-----------|
+| Word spotting hmean ICDAR2015, without a dictionary | 59.04%    |
+| GFlops                                        | 2.082     |
+| MParams                                       | 1.328     |
+| Source framework                              | PyTorch\* |
+
+*Hmean Word spotting* is defined and measured according to the
+[Incidental Scene Text (ICDAR2015) challenge](https://rrc.cvc.uab.es/?ch=4&com=introduction).
+
+## Performance
+
+## Inputs
+
+Name: `input` , shape: [1x64x28x28]. Text recognition features obtained from detection part.
+
+## Outputs
+
+Name: `output`, shape: [1x256x64x64]. Encoded text recognition features.
+
+
+## Legal Information
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/text-spotting-0001-recognizer-encoder/description/text-spotting-0001.png b/models/intel/text-spotting-0001-recognizer-encoder/description/text-spotting-0001.png
new file mode 100644
index 00000000000..d80aa3adbeb
Binary files /dev/null and b/models/intel/text-spotting-0001-recognizer-encoder/description/text-spotting-0001.png differ
diff --git a/models/intel/text-spotting-0001-recognizer-encoder/model.yml b/models/intel/text-spotting-0001-recognizer-encoder/model.yml
new file mode 100644
index 00000000000..045a9edc8bc
--- /dev/null
+++ b/models/intel/text-spotting-0001-recognizer-encoder/model.yml
@@ -0,0 +1,37 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  Encoder part of text recognition head that takes features from text-spotting-0001-detector
+  as input.
+task_type: feature_extraction
+files:
+  - name: FP32/text-spotting-0001-recognizer-encoder.xml
+    size: 9908
+    sha256: 2c088d1a1e3e21a31038022f4000f2604d34b53d0f3f84c7c99bca146890dfce
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-spotting-0001-recognizer-encoder/FP32/text-spotting-0001-recognizer-encoder.xml
+  - name: FP32/text-spotting-0001-recognizer-encoder.bin
+    size: 5311488
+    sha256: df3b4d491c953b022afbed4e0492b8f41046da3a6d3c65054884ac15af135942
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-spotting-0001-recognizer-encoder/FP32/text-spotting-0001-recognizer-encoder.bin
+  - name: FP16/text-spotting-0001-recognizer-encoder.xml
+    size: 9905
+    sha256: 8f9f51992f22d8d7b1588757cc1f71c712132d522bd439c38a298de980daf9ea
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-spotting-0001-recognizer-encoder/FP16/text-spotting-0001-recognizer-encoder.xml
+  - name: FP16/text-spotting-0001-recognizer-encoder.bin
+    size: 2655744
+    sha256: e0a2315c344e2adf69c31b24faa16fdc9496f48a9ba98c25ecef640f23710517
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/text-spotting-0001-recognizer-encoder/FP16/text-spotting-0001-recognizer-encoder.bin
+framework: dldt
+license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/unet-camvid-onnx-0001/description/unet-camvid-onnx-0001.md b/models/intel/unet-camvid-onnx-0001/description/unet-camvid-onnx-0001.md
new file mode 100644
index 00000000000..0004dcde497
--- /dev/null
+++ b/models/intel/unet-camvid-onnx-0001/description/unet-camvid-onnx-0001.md
@@ -0,0 +1,56 @@
+# unet-camvid-onnx-0001
+
+## Use Case and High-Level Description
+
+This is the UNet model that is designed to perform semantic segmentation. The model has been trained on the CamVid dataset from scratch using the PyTorch\* framework. Training used median frequency balancing for class weighting. For details about the original floating point model, check out the [paper](https://arxiv.org/pdf/1505.04597.pdf).
+
+The model input is a blob that consists of a single image of "1x3x368x480" in BGR order. The pixel values are integers in the [0, 255] range.
+
+The model output for `unet-camvid-onnx-0001` is the per-pixel probabilities of each input pixel belonging to one of the 12 classes of the CamVid dataset.
+
+## Specification
+
+| Metric            | Value                 |
+|-------------------|-----------------------|
+| GFlops            | 260.1                 |
+| MParams           | 31.03                 |
+| Source framework  | PyTorch\*             |
+
+## Accuracy
+
+The quality metrics were calculated on the CamVid validation dataset. The 'unlabeled' class was ignored during metrics calculation.
+
+| Metric                    | Value         |
+|---------------------------|---------------|
+| mIoU                      |        71.95% |
+
+- `IOU=TP/(TP+FN+FP)`, where:
+  - `TP` - number of true positive pixels for given class
+  - `FN` - number of false negative pixels for given class
+  - `FP` - number of false positive pixels for given class
+
+
+## Performance
+
+## Input
+
+Image, shape - `1,3,368,480`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`
+
+## Output
+
+Semantic segmentation class probabilities map, shape -`1,12,368,480`, output data format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - predicted probabilities of input pixel belonging to class `C` in [0, 1] range
+- `H` - vertical coordinate of the input pixel
+- `W` - horizontal coordinate of the input pixel
+
+## Legal Information
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/intel/vehicle-attributes-recognition-barrier-0039/model.yml b/models/intel/vehicle-attributes-recognition-barrier-0039/model.yml
index ad7beb99aff..43358a171be 100644
--- a/models/intel/vehicle-attributes-recognition-barrier-0039/model.yml
+++ b/models/intel/vehicle-attributes-recognition-barrier-0039/model.yml
@@ -13,33 +13,32 @@
 # limitations under the License.
 
 description: >-
-  This model presents a vehicle attributes classification algorithm for a traffic
-  analysis scenario.
+  Vehicle attributes recognition with modified ResNet10 backbone
 task_type: object_attributes
 files:
   - name: FP32/vehicle-attributes-recognition-barrier-0039.xml
-    size: 18179
-    sha256: 3d11a6c9920fd32ea34d59fe31a1f5e21fa2e112616c962dbdcb2c8f5afe5f42
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-attributes-recognition-barrier-0039/FP32/vehicle-attributes-recognition-barrier-0039.xml
+    size: 33367
+    sha256: b61160182cf8f3a67939d4d6cc837a1bcfd5cf0f443cea836ea23cc6bc0ec9d4
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-attributes-recognition-barrier-0039/FP32/vehicle-attributes-recognition-barrier-0039.xml
   - name: FP32/vehicle-attributes-recognition-barrier-0039.bin
-    size: 2504004
-    sha256: 8195ea60216d9aefdab41e3129900aa847f4f0d3d003ce93aa15ecba0ca18e91
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-attributes-recognition-barrier-0039/FP32/vehicle-attributes-recognition-barrier-0039.bin
+    size: 2504020
+    sha256: 26594e8bfc4e8de30a2186f4c30cfd44b82a4f4b4656fb32aa12d4f4888c832a
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-attributes-recognition-barrier-0039/FP32/vehicle-attributes-recognition-barrier-0039.bin
   - name: FP16/vehicle-attributes-recognition-barrier-0039.xml
-    size: 18165
-    sha256: e96f15c82e7bdc549c517d39ee6fe5364319748e99de9d75b09b7b2ab0802488
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-attributes-recognition-barrier-0039/FP16/vehicle-attributes-recognition-barrier-0039.xml
+    size: 33349
+    sha256: 8eedb7bbec7d5dc514ed107ff47e316cf0b002d977141394871fb7b21fb32c93
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-attributes-recognition-barrier-0039/FP16/vehicle-attributes-recognition-barrier-0039.xml
   - name: FP16/vehicle-attributes-recognition-barrier-0039.bin
-    size: 1252002
-    sha256: be8b61e337a23ffa57d1742f92d2317560303652f330fef0cbe918161bfcaf50
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-attributes-recognition-barrier-0039/FP16/vehicle-attributes-recognition-barrier-0039.bin
-  - name: INT8/vehicle-attributes-recognition-barrier-0039.xml
-    size: 64190
-    sha256: b416777d0ba15c4a525f04baa66835671528d1ca974d298c9b79facc0aa4a8ab
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-attributes-recognition-barrier-0039/INT8/vehicle-attributes-recognition-barrier-0039.xml
-  - name: INT8/vehicle-attributes-recognition-barrier-0039.bin
-    size: 2504004
-    sha256: 4ca9587b866ecc92418b87424ec5becb05f73a9781cd2eab6abeff7a54067590
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-attributes-recognition-barrier-0039/INT8/vehicle-attributes-recognition-barrier-0039.bin
+    size: 1252018
+    sha256: aed57f9cfdfc7dbd8955c5f6b15966bd0131050129835e2046451f06e4bde7b9
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-attributes-recognition-barrier-0039/FP16/vehicle-attributes-recognition-barrier-0039.bin
+  - name: FP32-INT8/vehicle-attributes-recognition-barrier-0039.xml
+    size: 87151
+    sha256: 0811f4541784e32f792e32b42e38c75ef202e16c0e9b5fd01122afb277763fce
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-attributes-recognition-barrier-0039/FP32-INT8/vehicle-attributes-recognition-barrier-0039.xml
+  - name: FP32-INT8/vehicle-attributes-recognition-barrier-0039.bin
+    size: 2512408
+    sha256: 649ee0087b451d4d9099156452a2b80092b5af673fc457f0cdd6cd6fd1aa05a4
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-attributes-recognition-barrier-0039/FP32-INT8/vehicle-attributes-recognition-barrier-0039.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/vehicle-detection-adas-0002/model.yml b/models/intel/vehicle-detection-adas-0002/model.yml
index 0aef50c7132..4790dfe2ec7 100644
--- a/models/intel/vehicle-detection-adas-0002/model.yml
+++ b/models/intel/vehicle-detection-adas-0002/model.yml
@@ -13,33 +13,33 @@
 # limitations under the License.
 
 description: >-
-  This is a vehicle detection network based on an SSD framework with tuned MobileNet
-  v1 as a feature extractor.
+  Vehicle detector based on SSD + MobileNet with reduced number of channels and depthwise
+  head.
 task_type: detection
 files:
   - name: FP32/vehicle-detection-adas-0002.xml
-    size: 80175
-    sha256: 0b42cb57a28284801a671994fd90da5d2312a7ed7e0b120975ace706ea064e80
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-detection-adas-0002/FP32/vehicle-detection-adas-0002.xml
+    size: 216043
+    sha256: b58c126cc2cf025442dd614159b0a6061c236eaecf8ae5f9d136b7b312499b31
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-detection-adas-0002/FP32/vehicle-detection-adas-0002.xml
   - name: FP32/vehicle-detection-adas-0002.bin
-    size: 4314468
-    sha256: bafe8ad70bb232e2b35928a31b9a4d3c7d4a6d6995b6bf2012c0ba9674f9d66d
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-detection-adas-0002/FP32/vehicle-detection-adas-0002.bin
+    size: 4314552
+    sha256: 6d0e114769bed9c8bd6666e098f891d7c158508bd7db6ba2bd4d09de17db1b69
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-detection-adas-0002/FP32/vehicle-detection-adas-0002.bin
   - name: FP16/vehicle-detection-adas-0002.xml
-    size: 80128
-    sha256: 87ce16187683eeec1bb623d1b936e1f7253588f4d7b9376eeb7f6a1b3a78f5a9
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-detection-adas-0002/FP16/vehicle-detection-adas-0002.xml
+    size: 215993
+    sha256: 3f68133b27949aae53f2fa118be8d980c91a87f8112f8fd84ab2dc0c77e13754
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-detection-adas-0002/FP16/vehicle-detection-adas-0002.xml
   - name: FP16/vehicle-detection-adas-0002.bin
-    size: 2157240
-    sha256: f2ce728a0140da04f1c7cb3726e73b8868055bc59518ed2bdd2de3a787dbf8cb
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-detection-adas-0002/FP16/vehicle-detection-adas-0002.bin
-  - name: INT8/vehicle-detection-adas-0002.xml
-    size: 3811792
-    sha256: f630d81c9f05eb76f5e539d6026f45437af6b448ba5211bdff95431008249ea8
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-detection-adas-0002/INT8/vehicle-detection-adas-0002.xml
-  - name: INT8/vehicle-detection-adas-0002.bin
-    size: 4314468
-    sha256: a7bf4a5edbc278a2d25ef33541958170670f346baf9dd07e6b02fc5618ba4a63
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-detection-adas-0002/INT8/vehicle-detection-adas-0002.bin
+    size: 2157328
+    sha256: e119b3bec50bc836f2eb26a56a40a6d5e3c33bde819f3e6d00f829978092742b
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-detection-adas-0002/FP16/vehicle-detection-adas-0002.bin
+  - name: FP32-INT8/vehicle-detection-adas-0002.xml
+    size: 438606
+    sha256: b7b2531985b025f42e40251ae1151a204e38c8db83ae1d4b565a8ce729cf1156
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-detection-adas-0002/FP32-INT8/vehicle-detection-adas-0002.xml
+  - name: FP32-INT8/vehicle-detection-adas-0002.bin
+    size: 4389736
+    sha256: 9fe53648e0a377c00e8b985817cd25dad320008e8d0a1048af4ac88aabf1a929
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-detection-adas-0002/FP32-INT8/vehicle-detection-adas-0002.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/vehicle-detection-adas-binary-0001/description/vehicle-detection-adas-binary-0001.md b/models/intel/vehicle-detection-adas-binary-0001/description/vehicle-detection-adas-binary-0001.md
index fff83ca8b25..35f945555f4 100644
--- a/models/intel/vehicle-detection-adas-binary-0001/description/vehicle-detection-adas-binary-0001.md
+++ b/models/intel/vehicle-detection-adas-binary-0001/description/vehicle-detection-adas-binary-0001.md
@@ -19,7 +19,7 @@ This detecector was created by binarization the vehicle-detection-adas-0002
 | GFlops                          | 0.75                                      |
 | GI1ops                          | 2.048                                     |
 | MParams                         | 1.079                                     |
-| Source framework                | Pytorch*                                  |
+| Source framework                | PyTorch*                                  |
 
 Average Precision metric described in: Mark Everingham et al.
 ["The PASCAL Visual Object Classes (VOC) Challenge"](http://host.robots.ox.ac.uk/pascal/VOC/pubs/everingham10.pdf).
diff --git a/models/intel/vehicle-detection-adas-binary-0001/model.yml b/models/intel/vehicle-detection-adas-binary-0001/model.yml
index 555ede929f5..908246d8bff 100644
--- a/models/intel/vehicle-detection-adas-binary-0001/model.yml
+++ b/models/intel/vehicle-detection-adas-binary-0001/model.yml
@@ -13,18 +13,17 @@
 # limitations under the License.
 
 description: >-
-  This is a vehicle detection network based on an SSD framework with tuned MobileNet
-  v1 as a feature extractor and using binary layer for speedup. This detecector
-  was created by binarization the vehicle-detection-adas-0002
+  Vehicle detector based on SSD + MobileNet with reduced number of channels and depthwise
+  head and binary layers.
 task_type: detection
 files:
-  - name: INT1/vehicle-detection-adas-binary-0001.xml
+  - name: FP32-INT1/vehicle-detection-adas-binary-0001.xml
     size: 105969
     sha256: c98bf5984895b1309861597ec36181446877407cd985bb490e14461f41312670
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-detection-adas-binary-0001/INT1/vehicle-detection-adas-binary-0001.xml
-  - name: INT1/vehicle-detection-adas-binary-0001.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-detection-adas-binary-0001/FP32-INT1/vehicle-detection-adas-binary-0001.xml
+  - name: FP32-INT1/vehicle-detection-adas-binary-0001.bin
     size: 2160500
     sha256: afdd8a2f175b2f19c07083ff23b2e28105f3d1c7dc06a4b1a1d5c2c42b98294f
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-detection-adas-binary-0001/INT1/vehicle-detection-adas-binary-0001.bin
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-detection-adas-binary-0001/FP32-INT1/vehicle-detection-adas-binary-0001.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/intel/vehicle-license-plate-detection-barrier-0106/model.yml b/models/intel/vehicle-license-plate-detection-barrier-0106/model.yml
index 360b79cfa57..c05d7368374 100644
--- a/models/intel/vehicle-license-plate-detection-barrier-0106/model.yml
+++ b/models/intel/vehicle-license-plate-detection-barrier-0106/model.yml
@@ -13,33 +13,32 @@
 # limitations under the License.
 
 description: >-
-  This is a MobileNetV2 + SSD-based vehicle and (Chinese) license plate detector
-  for the "Barrier" use case.
+  Multiclass (vehicle, license plate) detector based on MobileNetV2+SSD
 task_type: detection
 files:
   - name: FP32/vehicle-license-plate-detection-barrier-0106.xml
-    size: 100057
-    sha256: d17983e551fa9f98227fb4374e59e360d5d3a0ffeb1e29e5eae0ef62c47b30e2
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-license-plate-detection-barrier-0106/FP32/vehicle-license-plate-detection-barrier-0106.xml
+    size: 204476
+    sha256: 0c4abcf31945d04fc33459625988176ade8e0986a8e2b4499c1ec511177217a4
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-license-plate-detection-barrier-0106/FP32/vehicle-license-plate-detection-barrier-0106.xml
   - name: FP32/vehicle-license-plate-detection-barrier-0106.bin
-    size: 2573296
-    sha256: 0d986cddcc0c497c4ffe03619967b1da8743bfa031357945377715c4ab7fae1d
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-license-plate-detection-barrier-0106/FP32/vehicle-license-plate-detection-barrier-0106.bin
+    size: 2573380
+    sha256: 2a6f1cd0eb8731ef059a91299bce0be026d2cebb1ae42cbee37b6aef7da2764b
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-license-plate-detection-barrier-0106/FP32/vehicle-license-plate-detection-barrier-0106.bin
   - name: FP16/vehicle-license-plate-detection-barrier-0106.xml
-    size: 99989
-    sha256: 35c9d015243462de13410c5695d3d83533308a092dcef8c7a767ab60e75a8b1d
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-license-plate-detection-barrier-0106/FP16/vehicle-license-plate-detection-barrier-0106.xml
+    size: 204408
+    sha256: 6fc62d36f52ccfa34eced7c8e3c260e9870a8b5c42fe413a76a1321f10a637dc
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-license-plate-detection-barrier-0106/FP16/vehicle-license-plate-detection-barrier-0106.xml
   - name: FP16/vehicle-license-plate-detection-barrier-0106.bin
-    size: 1286674
-    sha256: c23eee855d2049c864e6e242bd73f0be38b7550cc92103df36ca04d1ca894d39
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-license-plate-detection-barrier-0106/FP16/vehicle-license-plate-detection-barrier-0106.bin
-  - name: INT8/vehicle-license-plate-detection-barrier-0106.xml
-    size: 893115
-    sha256: dbcccae712f53a6e1c18b196effc30d5a0b7900fbe040483802b466d42df1c6a
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-license-plate-detection-barrier-0106/INT8/vehicle-license-plate-detection-barrier-0106.xml
-  - name: INT8/vehicle-license-plate-detection-barrier-0106.bin
-    size: 2573400
-    sha256: e672e03e13630b9a5bceccaf149563c66c1915dc22aa0d613404cd30dec48274
-    source: https://download.01.org/opencv/2019/open_model_zoo/R3/20190905_163000_models_bin/vehicle-license-plate-detection-barrier-0106/INT8/vehicle-license-plate-detection-barrier-0106.bin
+    size: 1286758
+    sha256: 57652e098f93ee712eb412267612cb7bf2713475f96ec1e18eca10e4bef69785
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-license-plate-detection-barrier-0106/FP16/vehicle-license-plate-detection-barrier-0106.bin
+  - name: FP32-INT8/vehicle-license-plate-detection-barrier-0106.xml
+    size: 519016
+    sha256: 0037685af2cc25f569c7db066ab6e9673a0faae204d8f2f19a003b28bd21bb28
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-license-plate-detection-barrier-0106/FP32-INT8/vehicle-license-plate-detection-barrier-0106.xml
+  - name: FP32-INT8/vehicle-license-plate-detection-barrier-0106.bin
+    size: 2642612
+    sha256: 2f81d5803d76e90f9000c17083536ece01e7127c407e5bec7a6caef07ac01082
+    source: https://download.01.org/opencv/2020/openvinotoolkit/2020.1/open_model_zoo/models_bin/1/vehicle-license-plate-detection-barrier-0106/FP32-INT8/vehicle-license-plate-detection-barrier-0106.bin
 framework: dldt
 license: https://raw.githubusercontent.com/opencv/open_model_zoo/master/LICENSE
diff --git a/models/public/Sphereface/Sphereface.md b/models/public/Sphereface/Sphereface.md
index 429d21ec8b8..72969f64db0 100644
--- a/models/public/Sphereface/Sphereface.md
+++ b/models/public/Sphereface/Sphereface.md
@@ -48,7 +48,7 @@ Channel order is `BGR`.
 
 ### Original model
 
-Face embedings, name - `fc5`,  shape - `1,512`, output data format  - `B,C`, where:
+Face embeddings, name - `fc5`,  shape - `1,512`, output data format  - `B,C`, where:
 
 - `B` - batch size
 - `C` - row-vector of 512 floating points values, face embeddings
@@ -57,7 +57,7 @@ The net outputs on different images are comparable in cosine distance.
 
 ### Converted model
 
-Face embedings, name - `fc5`,  shape - `1,512`, output data format  - `B,C`, where:
+Face embeddings, name - `fc5`,  shape - `1,512`, output data format  - `B,C`, where:
 
 - `B` - batch size
 - `C` - row-vector of 512 floating points values, face embeddings
@@ -66,4 +66,29 @@ The net outputs on different images are comparable in cosine distance.
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/wy1iu/sphereface/master/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/wy1iu/sphereface/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2017 Weiyang Liu and Yandong Wen
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/alexnet/alexnet.md b/models/public/alexnet/alexnet.md
index 8041948c737..81ea6829bd2 100644
--- a/models/public/alexnet/alexnet.md
+++ b/models/public/alexnet/alexnet.md
@@ -71,4 +71,9 @@ Object classifier according to ImageNet classes, name - `prob`, shape - `1,1000`
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/BVLC/caffe/master/models/bvlc_alexnet/readme.md]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/BVLC/caffe/master/models/bvlc_alexnet/readme.md):
+
+```
+This model is released for unrestricted use.
+```
diff --git a/models/public/alexnet/model.yml b/models/public/alexnet/model.yml
index da6a56815c7..d24dc3d9087 100644
--- a/models/public/alexnet/model.yml
+++ b/models/public/alexnet/model.yml
@@ -13,16 +13,16 @@
 # limitations under the License.
 
 description: >-
-  The `alexnet` model is designed to perform image classification. Just like other
-  common classification models, the `alexnet` model has been pretrained on the
-  ImageNet image database. For details about this model, check out the paper <http://papers.nips.cc/paper/4824-imagenet-classification-with-deep-convolutional-neural-networks.pdf>.
+  The "alexnet" model is designed to perform image classification. Just like other
+  common classification models, the "alexnet" model has been pretrained on the ImageNet
+  image database. For details about this model, check out the paper <http://papers.nips.cc/paper/4824-imagenet-classification-with-deep-convolutional-neural-networks.pdf>.
 
-  The model input is a blob that consists of a single image of 1x3x227x227 in
-  BGR order. The BGR mean values need to be subtracted as follows: [104, 117,
-  123] before passing the image blob into the network.
+  The model input is a blob that consists of a single image of 1x3x227x227 in BGR
+  order. The BGR mean values need to be subtracted as follows: [104, 117, 123] before
+  passing the image blob into the network.
 
-  The model output for `alexnet` is the usual object classifier output for the
-  1000 different classifications matching those in the ImageNet database.
+  The model output for "alexnet" is the usual object classifier output for the 1000
+  different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: alexnet.prototxt
diff --git a/models/public/brain-tumor-segmentation-0001/brain-tumor-segmentation-0001.md b/models/public/brain-tumor-segmentation-0001/brain-tumor-segmentation-0001.md
index d8669e4f579..019846eb90c 100644
--- a/models/public/brain-tumor-segmentation-0001/brain-tumor-segmentation-0001.md
+++ b/models/public/brain-tumor-segmentation-0001/brain-tumor-segmentation-0001.md
@@ -82,4 +82,6 @@ With the following channels: `background`, `necrotic core`, `edema` and `enhanci
 
 ## Legal Information
 
-[https://github.com/lachinov/brats2018-graphlabunn/blob/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://github.com/lachinov/brats2018-graphlabunn/blob/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0.txt](../licenses/APACHE-2.0.txt).
diff --git a/models/public/brain-tumor-segmentation-0002/brain-tumor-segmentation-0002.md b/models/public/brain-tumor-segmentation-0002/brain-tumor-segmentation-0002.md
new file mode 100644
index 00000000000..d4a6b3e7a06
--- /dev/null
+++ b/models/public/brain-tumor-segmentation-0002/brain-tumor-segmentation-0002.md
@@ -0,0 +1,134 @@
+# Brain-tumor-segmentation-0002
+
+## Use Case and High-Level Description
+
+This model was created for participation in the [Brain Tumor Segmentation Challenge](https://www.med.upenn.edu/cbica/brats2019/registration.html) (BraTS) 2019. It has the UNet architecture trained with residual blocks.
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Segmentation  |
+| GFLOPs            | 300.801       |
+| MParams           | 4.51          |
+| Source framework  | PyTorch\*       |
+
+## Accuracy
+
+See [BRATS 2019 Leaderboard](https://www.cbica.upenn.edu/BraTS19/lboardValidation.html). The metrics 
+for challenge validation (Dice_WT, Dice_TC, Dice_ET) differ from the metrics reported below (which 
+are compatible with input labels):
+
+- WT (whole tumor) class combines all three tumor classes:
+    - necrotic core / non-enhancing tumor
+    - edema
+    - enhancing tumor
+- TC (tumor core) combines the following classes:
+    - necrotic core
+    - non-enhancing tumor
+- ET (enhancing tumor)
+
+The following accuracy metrics are measured on a `brain tumor` training subset of the [Medical Decathlon](http://medicaldecathlon.com/) dataset. 
+
+**Mean**:
+- Dice index for "overall": 0.915
+- Dice index for "necrotic core / non-enhancing tumor": 0.806
+- Dice index for "edema": 0.611
+- Dice index for "enhancing tumor": 0.794
+
+**Median**:
+- Dice index for "overall": 0.927
+- Dice index for "necrotic core / non-enhancing tumor": 0.835
+- Dice index for "edema": 0.644
+- Dice index for "enhancing tumor": 0.86
+
+  
+> **NOTE**: The accuracy achieved with ONNX\* model adapted for OpenVINO™ can slightly differ from the accuracy achieved with the original PyTorch model since the upsampling operation was changed from the `trilinear` to `nearest` mode.
+
+## Performance
+
+## Input
+
+The model takes as an input four MRI modalities `T1`, `T1ce`, `T2`, `Flair`. Find additional information on the [BraTS 2019 page](https://www.med.upenn.edu/cbica/brats2019/registration.html) and [wiki](https://en.wikipedia.org/wiki/Magnetic_resonance_imaging).
+In the preprocessing pipeline, each modality should be z-score normalized separately. The input tensor is a concatenation of the four input modalities.
+
+### Original Model
+
+MR Image, name - `0`, shape - `1,4,128,128,128`, format is `B,C,D,H,W`, where:
+
+- `B` - batch size
+- `C` - channel
+- `D` - depth
+- `H` - height
+- `W` - width
+
+The channels are ordered as `T1`, `T1ce`, `T2`, `Flair`.
+
+### Converted Model
+
+MR Image, name - `0`, shape - `1,4,128,128,128`, format is `B,C,D,H,W`, where:
+
+- `B` - batch size
+- `C` - channel
+- `D` - depth
+- `H` - height
+- `W` - width
+
+The channels are ordered as `T1`, `T1ce`, `T2`, `Flair`.
+
+## Output
+
+### Original Model
+
+Probabilities of the given voxel to be in the corresponding class, name - `304`, shape - `1,3,128,128,128`, output data format is `B,C,D,H,W`, where:
+
+- `B` - batch size
+- `C` - channel
+- `D` - depth
+- `H` - height
+- `W` - width
+
+The channels are ordered as `whole tumor`, `tumor core`, and `enhancing tumor`.
+
+### Converted Model
+
+Probabilities of the given voxel to be in the corresponding class, name - `304`, shape - `1,3,128,128,128`, output data format is `B,C,D,H,W`, where:
+
+- `B` - batch size
+- `C` - channel
+- `D` - depth
+- `H` - height
+- `W` - width
+
+The channels are ordered as `whole tumor`, `tumor core`, and `enhancing tumor`.
+
+## Legal Information
+
+The original model is distributed under the
+[MIT License](https://raw.githubusercontent.com/lachinov/brats2019/master/LICENSE).
+
+```
+The MIT License
+
+Copyright (c) 2019 Dmitrii Lachinov
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in
+all copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
+THE SOFTWARE.
+```
\ No newline at end of file
diff --git a/models/public/brain-tumor-segmentation-0002/model.yml b/models/public/brain-tumor-segmentation-0002/model.yml
new file mode 100644
index 00000000000..0e468f84287
--- /dev/null
+++ b/models/public/brain-tumor-segmentation-0002/model.yml
@@ -0,0 +1,31 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  This model was created for participation in the Brain Tumor Segmentation Challenge
+  <https://www.med.upenn.edu/cbica/brats2019/registration.html> (BraTS) 2019. It has
+  the UNet architecture trained with residual blocks.
+task_type: semantic_segmentation
+files:
+  - name: brain-tumor-segmentation-0002.onnx
+    size: 21735156
+    sha256: 97726901bc4f0f2c5e583d38d0ff4631d92ebcdb18bf5e2e859c3703a9b86d2d
+    source:
+      $type: google_drive
+      id: 1NhH51NgKJKhu0Bax_IKQ_Byvoe2bItPX
+model_optimizer_args:
+  - --input_shape=[1,4,128,128,128]
+  - --input_model=$dl_dir/brain-tumor-segmentation-0002.onnx
+framework: onnx
+license: https://raw.githubusercontent.com/lachinov/brats2019/master/LICENSE
diff --git a/models/public/caffenet/caffenet.md b/models/public/caffenet/caffenet.md
index b4c6e2ef012..9b8c91dc866 100644
--- a/models/public/caffenet/caffenet.md
+++ b/models/public/caffenet/caffenet.md
@@ -58,4 +58,9 @@ probability for each class.
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/BVLC/caffe/master/models/bvlc_reference_caffenet/readme.md]()
\ No newline at end of file
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/BVLC/caffe/master/models/bvlc_reference_caffenet/readme.md):
+
+```
+This model is released for unrestricted use.
+```
diff --git a/models/public/caffenet/model.yml b/models/public/caffenet/model.yml
index bf339aee897..7ae41393b15 100644
--- a/models/public/caffenet/model.yml
+++ b/models/public/caffenet/model.yml
@@ -13,8 +13,7 @@
 # limitations under the License.
 
 description: >-
-  CaffeNet model. Used for classification. For details see paper
-  <https://arxiv.org/abs/1408.5093>.
+  CaffeNet* model is used for classification. For details see paper <https://arxiv.org/abs/1408.5093>.
 task_type: classification
 files:
   - name: bvlc_reference_caffenet.caffemodel
diff --git a/models/public/colorization-v2-norebal/colorization-v2-norebal.md b/models/public/colorization-v2-norebal/colorization-v2-norebal.md
new file mode 100644
index 00000000000..7c677596062
--- /dev/null
+++ b/models/public/colorization-v2-norebal/colorization-v2-norebal.md
@@ -0,0 +1,120 @@
+# colorization-v2-norebal
+
+## Use Case and High-Level Description
+
+The `colorization-v2-norebal` model is one of the [colorization](https://arxiv.org/pdf/1603.08511)
+group of models designed to perform image colorization. For details
+about this family of models, check out the [repository](https://github.com/richzhang/colorization).
+
+This model differs from model `colorization-v2` in that metrics did not take into account
+balancing of rare classes during training.
+
+The model takes the L-channel of a LAB image as input.
+The model outputs the predicted A- and B-channels of the LAB image.
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Colorization  |
+| GFLOPs            | -             |
+| MParams           | -             |
+| Source framework  | Caffe\*       |
+
+## Accuracy
+
+The accuracy metrics were calculated on the ImageNet
+validation dataset using the [VGG16](https://arxiv.org/pdf/1409.1556.pdf) Caffe
+model with colorization as preprocessing.
+
+For the preprocessing `rgb -> gray -> colorization`, the following values were received:
+
+| Metric         | Value with preprocessing   | Value without preprocessing |
+|----------------|-----------------------------|-----------------------------|
+| Accuracy top-1 |                      57.24% |                      70.96% |
+| Accuracy top-5 |                      80.96% |                      89.88% |
+
+## Performance
+
+## Input
+
+### Original model
+
+Image, name - `data_l`,  shape - `1,1,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is L-channel.
+Mean values - 50.
+
+### Converted model
+
+Image, name - `data_l`,  shape - `1,1,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is L-channel.
+
+## Output
+
+
+### Original model
+
+Image, name - `class8_ab`\*,  shape - `1,2,56,56`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+### Converted model
+
+Image, name - `class8_313_rh`\*,  shape - `1,313,56,56`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+> **NOTE**: The `class8_313_rh` layer precedes the `class8_ab` layer.
+For the network to work,
+you need to reproduce the `class8_ab` layer with the coefficients that
+are downloaded separately with the model.
+
+## Legal Information
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/richzhang/colorization/master/LICENSE):
+
+```
+Copyright (c) 2016, Richard Zhang, Phillip Isola, Alexei A. Efros
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+
+* Redistributions of source code must retain the above copyright notice, this
+  list of conditions and the following disclaimer.
+
+* Redistributions in binary form must reproduce the above copyright notice,
+  this list of conditions and the following disclaimer in the documentation
+  and/or other materials provided with the distribution.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
+FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
+SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/colorization-v2-norebal/model.yml b/models/public/colorization-v2-norebal/model.yml
new file mode 100644
index 00000000000..08442402467
--- /dev/null
+++ b/models/public/colorization-v2-norebal/model.yml
@@ -0,0 +1,53 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+    The colorization-v2-norebal model is one of the colorization
+    group of models designed to perform image colorization. For details
+    about this family of models, check out the repository - https://github.com/richzhang/colorization.
+
+    This model differs from model `colorization-v2` in that metrics did not take into account
+    balancing of rare classes during training.
+
+    The model takes the L-channel of a LAB image as input.
+    The model outputs the predicted A- and B-channels of the LAB image.
+
+task_type: "colorization"
+files:
+  - name: colorization-v2-norebal.prototxt
+    sha256: d16418cef8df4ccd703a55ae0ef3960861d5010418f77c90d0a47689998a7169
+    source: https://raw.githubusercontent.com/richzhang/colorization/master/models/colorization_deploy_v2.prototxt
+    size: 9945
+  - name: colorization-v2-norebal.caffemodel
+    size: 128946454
+    sha256: 6ab42a7fa853eb7ca822b9a0a2997a08a29c819c985c3e70b460c6be9c8b2159
+    source: https://people.eecs.berkeley.edu/~rich.zhang/projects/2016_colorization/files/demo_v2/colorization_release_v2_norebal.caffemodel
+  - name: colorization-v2-norebal.npy
+    size: 5088
+    sha256: b5dec01315c34f43f1c8c089e84c45ae35d1838d8e77ed0e7ca930f79ffa450e
+    source: https://github.com/richzhang/colorization/raw/master/resources/pts_in_hull.npy
+model_optimizer_args:
+  - --input_shape=[1,1,224,224]
+  - --input=data_l
+  - --mean_values=data_l[50]
+  - --output=class8_313_rh
+  - --input_model=$dl_dir/colorization-v2-norebal.caffemodel
+  - --input_proto=$dl_dir/colorization-v2-norebal.prototxt
+postprocessing:
+  - $type: regex_replace
+    file: colorization-v2-norebal.prototxt
+    pattern: 'layer {\n  name: "Silence"\n  type: "Silence"\n  bottom: "class8_ab"\n}'
+    replacement: ''
+framework: caffe
+license: https://raw.githubusercontent.com/richzhang/colorization/master/LICENSE
diff --git a/models/public/colorization-v2/colorization-v2.md b/models/public/colorization-v2/colorization-v2.md
new file mode 100644
index 00000000000..07ebba1b892
--- /dev/null
+++ b/models/public/colorization-v2/colorization-v2.md
@@ -0,0 +1,117 @@
+# colorization-v2
+
+## Use Case and High-Level Description
+
+The `colorization-v2` model is one of the [colorization](https://arxiv.org/pdf/1603.08511)
+group of models designed to perform image colorization. For details
+about this family of models, check out the [repository](https://github.com/richzhang/colorization).
+
+The model takes the L-channel of a LAB image as input.
+The model outputs the predicted A- and B-channels of the LAB image.
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Colorization  |
+| GFLOPs            | -             |
+| MParams           | -             |
+| Source framework  | Caffe\*       |
+
+## Accuracy
+
+The accuracy metrics were calculated on the ImageNet
+validation dataset using the [VGG16](https://arxiv.org/pdf/1409.1556.pdf) Caffe
+model with colorization as preprocessing.
+
+For the preprocessing `rgb -> gray -> colorization`, the following values were received:
+
+| Metric         | Value with preprocessing   | Value without preprocessing |
+|----------------|-----------------------------|-----------------------------|
+| Accuracy top-1 |                      55.39% |                      70.96% |
+| Accuracy top-5 |                      79.21% |                      89.88% |
+
+## Performance
+
+## Input
+
+### Original model
+
+Image, name - `data_l`,  shape - `1,1,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is L-channel.
+Mean values - 50.
+
+### Converted model
+
+Image, name - `data_l`,  shape - `1,1,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is L-channel.
+
+## Output
+
+### Original model
+
+Image, name - `class8_ab`\*,  shape - `1,2,56,56`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+### Converted model
+
+Image, name - `class8_313_rh`\*,  shape - `1,313,56,56`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+> **NOTE**: The `class8_313_rh` layer precedes the `class8_ab` layer.
+For the network to work,
+you need to reproduce the `class8_ab` layer with the coefficients that
+are downloaded separately with the model. More detailed information can be found
+in [this notebook](https://github.com/richzhang/colorization/blob/master/demo/colorization_demo_v2.ipynb).
+
+## Legal Information
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/richzhang/colorization/master/LICENSE):
+
+```
+Copyright (c) 2016, Richard Zhang, Phillip Isola, Alexei A. Efros
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+
+* Redistributions of source code must retain the above copyright notice, this
+  list of conditions and the following disclaimer.
+
+* Redistributions in binary form must reproduce the above copyright notice,
+  this list of conditions and the following disclaimer in the documentation
+  and/or other materials provided with the distribution.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
+FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
+SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/colorization-v2/model.yml b/models/public/colorization-v2/model.yml
new file mode 100644
index 00000000000..c3d9e594c3c
--- /dev/null
+++ b/models/public/colorization-v2/model.yml
@@ -0,0 +1,50 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+    The colorization-v2 model is one of the colorization
+    group of models designed to perform image colorization. For details
+    about this family of models, check out the repository - https://github.com/richzhang/colorization.
+
+    Model consumes as input L-channel of LAB-image.
+    Model gives as output predicted A- and B-channels of LAB-image.
+
+task_type: "colorization"
+files:
+  - name: colorization-v2.prototxt
+    sha256: d16418cef8df4ccd703a55ae0ef3960861d5010418f77c90d0a47689998a7169
+    source: https://raw.githubusercontent.com/richzhang/colorization/master/models/colorization_deploy_v2.prototxt
+    size: 9945
+  - name: colorization-v2.caffemodel
+    size: 128946764
+    sha256: f5af1e602646328c792e1094f9876fe9cd4c09ac46fa886e5708a1abc89137b1
+    source: http://eecs.berkeley.edu/~rich.zhang/projects/2016_colorization/files/demo_v2/colorization_release_v2.caffemodel
+  - name: colorization-v2.npy
+    size: 5088
+    sha256: b5dec01315c34f43f1c8c089e84c45ae35d1838d8e77ed0e7ca930f79ffa450e
+    source: https://github.com/richzhang/colorization/raw/master/resources/pts_in_hull.npy
+model_optimizer_args:
+  - --input_shape=[1,1,224,224]
+  - --input=data_l
+  - --mean_values=data_l[50]
+  - --output=class8_313_rh
+  - --input_model=$dl_dir/colorization-v2.caffemodel
+  - --input_proto=$dl_dir/colorization-v2.prototxt
+postprocessing:
+  - $type: regex_replace
+    file: colorization-v2.prototxt
+    pattern: 'layer {\n  name: "Silence"\n  type: "Silence"\n  bottom: "class8_ab"\n}'
+    replacement: ''
+framework: caffe
+license: https://raw.githubusercontent.com/richzhang/colorization/master/LICENSE
diff --git a/models/public/ctdet_coco_dlav0_384/ctdet_coco_dlav0_384.md b/models/public/ctdet_coco_dlav0_384/ctdet_coco_dlav0_384.md
new file mode 100644
index 00000000000..53a1f23e748
--- /dev/null
+++ b/models/public/ctdet_coco_dlav0_384/ctdet_coco_dlav0_384.md
@@ -0,0 +1,113 @@
+# ctdet_coco_dlav0_384
+
+## Use Case and High-Level Description
+
+CenterNet object detection model `ctdet_coco_dlav0_384` originally trained on PyTorch\*
+then converted to ONNX\* format. CenterNet models an object as a single point - the center point of its bounding box
+and uses keypoint estimation to find center points and regresses to object size.
+For details see [paper](http://arxiv.org/abs/1904.07850), [repository](https://github.com/xingyizhou/CenterNet/).
+
+### Steps to Reproduce PyTorch to ONNX Conversion
+Model is provided in ONNX format, which was obtained by the following steps.
+
+1. Clone the original repository
+```sh
+git clone https://github.com/xingyizhou/CenterNet
+cd CenterNet
+```
+2. Checkout the commit that the conversion was tested on:
+```sh
+git checkout 8ef87b4
+```
+3. Apply the `pytorch-onnx.patch` patch
+```sh
+git apply /path/to/pytorch-onnx.patch
+```
+4. Follow the original [installation steps](https://github.com/xingyizhou/CenterNet/blob/8ef87b4/readme/INSTALL.md)
+5. Download the [pretrained weights](https://drive.google.com/open?id=18yBxWOlhTo32_swSug_HM4q3BeWgxp_N)
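+6. Run the conversion script from the `src` directory of the repository (the patch creates `src/convert.py`):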
+```sh
+python convert.py ctdet --load_model /path/to/downloaded/weights.pth --exp_id coco_dlav0_384 --arch dlav0_34 --input_res 384 --gpus -1
+```
+
+## Example
+
+## Specification
+
+| Metric                          | Value                                     |
+|---------------------------------|-------------------------------------------|
+| Type                            | Object detection                          |
+| GFlops                          | 34.994                                    |
+| MParams                         | 17.911                                    |
+| Source framework                | PyTorch\*                                 |
+
+## Accuracy
+
+| Metric | Original model | Converted model |
+| ------ | -------------- | --------------- |
+| MAP    | 41.81          | 41.5            |
+
+## Performance
+
+## Input
+
+### Original Model
+
+Image, name: `input.1`, shape: [1x3x384x384], format: [BxCxHxW]
+   where:
+
+    - B - batch size
+    - C - number of channels
+    - H - image height
+    - W - image width
+
+   Expected color order: BGR.
+   Mean values: [104.04, 113.985, 119.85], scale values: [73.695, 69.87, 70.89].
+
+### Converted Model
+
+Image, name: `input.1`, shape: [1x3x384x384], format: [BxCxHxW]
+   where:
+
+    - B - batch size
+    - C - number of channels
+    - H - image height
+    - W - image width
+
+   Expected color order: BGR.
+
+## Output
+
+1. Object center points heatmap, name: `508`. Contains predicted object center points for each of the 80 categories of the MSCOCO\* dataset (the version with 80 object categories, without a background label).
+2. Object size output, name: `511`. Contains predicted width and height for each object.
+3. Regression output, name: `514`. Contains offsets for each prediction.
+
+## Legal Information
+
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/xingyizhou/CenterNet/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2019 Xingyi Zhou
+All rights reserved.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/ctdet_coco_dlav0_384/model.yml b/models/public/ctdet_coco_dlav0_384/model.yml
new file mode 100644
index 00000000000..de75ee2d816
--- /dev/null
+++ b/models/public/ctdet_coco_dlav0_384/model.yml
@@ -0,0 +1,35 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  CenterNet object detection model "ctdet_coco_dlav0_384" originally trained on PyTorch*
+  then converted to ONNX* format. CenterNet models an object as a single point - the
+  center point of its bounding box and uses keypoint estimation to find center points
+  and regresses to object size. For details see paper <http://arxiv.org/abs/1904.07850>,
+  repository <https://github.com/xingyizhou/CenterNet/>.
+task_type: detection
+files:
+  - name: ctdet_coco_dlav0_384.onnx
+    size: 74027749
+    sha256: 4aabb6d13aa662ef6b7fd3a9fe914e1d133ec621945e6ab19597b624a72604a6
+    source: https://download.01.org/opencv/public_models/122019/ctdet_coco_dlav0/ctdet_coco_dlav0_384.onnx
+model_optimizer_args:
+  - --input_shape=[1,3,384,384]
+  - --input=input.1
+  - --mean_values=input.1[104.04, 113.985, 119.85]
+  - --scale_values=input.1[73.695, 69.87, 70.89]
+  - --output=508,511,514
+  - --input_model=$dl_dir/ctdet_coco_dlav0_384.onnx
+framework: onnx
+license: https://raw.githubusercontent.com/xingyizhou/CenterNet/master/LICENSE
diff --git a/models/public/ctdet_coco_dlav0_384/pytorch-onnx.patch b/models/public/ctdet_coco_dlav0_384/pytorch-onnx.patch
new file mode 100644
index 00000000000..241fbff9ae3
--- /dev/null
+++ b/models/public/ctdet_coco_dlav0_384/pytorch-onnx.patch
@@ -0,0 +1,35 @@
+diff --git a/src/convert.py b/src/convert.py
+new file mode 100644
+index 0000000..16888b6
+--- /dev/null
++++ b/src/convert.py
+@@ -0,0 +1,12 @@
++import torch.onnx
++import onnx
++
++import _init_paths
++from opts import opts
++from detectors.detector_factory import detector_factory
++
++opt = opts().init()
++Detector = detector_factory[opt.task]
++detector = Detector(opt)
++input_shape = [1, 3, opt.input_res, opt.input_res]
++torch.onnx.export(detector.model, torch.randn(input_shape), 'ctdet_coco_dlav0_{}.onnx'.format(opt.input_res), export_params=True)
+diff --git a/src/lib/models/networks/dlav0.py b/src/lib/models/networks/dlav0.py
+index 3ff343c..99e2e88 100644
+--- a/src/lib/models/networks/dlav0.py
++++ b/src/lib/models/networks/dlav0.py
+@@ -602,9 +602,9 @@ class DLASeg(nn.Module):
+         x = self.dla_up(x[self.first_level:])
+         # x = self.fc(x)
+         # y = self.softmax(self.up(x))
+-        ret = {}
+-        for head in self.heads:
+-            ret[head] = self.__getattr__(head)(x)
++        ret = []
++        for head in sorted(self.heads.keys()):
++            ret.append(self.__getattr__(head)(x))
+         return [ret]
+ 
+     '''
diff --git a/models/public/ctdet_coco_dlav0_512/ctdet_coco_dlav0_512.md b/models/public/ctdet_coco_dlav0_512/ctdet_coco_dlav0_512.md
new file mode 100644
index 00000000000..c00ed236a3b
--- /dev/null
+++ b/models/public/ctdet_coco_dlav0_512/ctdet_coco_dlav0_512.md
@@ -0,0 +1,113 @@
+# ctdet_coco_dlav0_512
+
+## Use Case and High-Level Description
+
+CenterNet object detection model `ctdet_coco_dlav0_512` originally trained on PyTorch\*
+then converted to ONNX\* format. CenterNet models an object as a single point - the center point of its bounding box
+and uses keypoint estimation to find center points and regresses to object size.
+For details see [paper](http://arxiv.org/abs/1904.07850), [repository](https://github.com/xingyizhou/CenterNet/).
+
+### Steps to Reproduce PyTorch to ONNX Conversion
+Model is provided in ONNX format, which was obtained by the following steps.
+
+1. Clone the original repository
+```sh
+git clone https://github.com/xingyizhou/CenterNet
+cd CenterNet
+```
+2. Checkout the commit that the conversion was tested on:
+```sh
+git checkout 8ef87b4
+```
+3. Apply the `pytorch-onnx.patch` patch
+```sh
+git apply /path/to/pytorch-onnx.patch
+```
+4. Follow the original [installation steps](https://github.com/xingyizhou/CenterNet/blob/8ef87b4/readme/INSTALL.md)
+5. Download the [pretrained weights](https://drive.google.com/open?id=18yBxWOlhTo32_swSug_HM4q3BeWgxp_N)
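+6. Run the conversion script from the `src` directory of the repository (the patch creates `src/convert.py`):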
+```sh
+python convert.py ctdet --load_model /path/to/downloaded/weights.pth --exp_id coco_dlav0_512 --arch dlav0_34 --input_res 512 --gpus -1
+```
+
+## Example
+
+## Specification
+
+| Metric                          | Value                                     |
+|---------------------------------|-------------------------------------------|
+| Type                            | Object detection                          |
+| GFlops                          | 62.211                                    |
+| MParams                         | 17.911                                    |
+| Source framework                | PyTorch\*                                 |
+
+## Accuracy
+
+| Metric | Original model | Converted model |
+| ------ | -------------- | --------------- |
+| MAP    | 44.2           | 44.2            |
+
+## Performance
+
+## Input
+
+### Original Model
+
+Image, name: `input.1`, shape: [1x3x512x512], format: [BxCxHxW]
+   where:
+
+    - B - batch size
+    - C - number of channels
+    - H - image height
+    - W - image width
+
+   Expected color order: BGR.
+   Mean values: [104.04, 113.985, 119.85], scale values: [73.695, 69.87, 70.89].
+
+### Converted Model
+
+Image, name: `input.1`, shape: [1x3x512x512], format: [BxCxHxW]
+   where:
+
+    - B - batch size
+    - C - number of channels
+    - H - image height
+    - W - image width
+
+   Expected color order: BGR.
+
+## Output
+
+1. Object center points heatmap, name: `508`. Contains predicted object center points for each of the 80 categories of the MSCOCO\* dataset (the version with 80 object categories, without a background label).
+2. Object size output, name: `511`. Contains predicted width and height for each object.
+3. Regression output, name: `514`. Contains offsets for each prediction.
+
+## Legal Information
+
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/xingyizhou/CenterNet/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2019 Xingyi Zhou
+All rights reserved.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/ctdet_coco_dlav0_512/model.yml b/models/public/ctdet_coco_dlav0_512/model.yml
new file mode 100644
index 00000000000..407dfa27f68
--- /dev/null
+++ b/models/public/ctdet_coco_dlav0_512/model.yml
@@ -0,0 +1,35 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  CenterNet object detection model "ctdet_coco_dlav0_512" originally trained on PyTorch*
+  then converted to ONNX* format. CenterNet models an object as a single point - the
+  center point of its bounding box and uses keypoint estimation to find center points
+  and regresses to object size. For details see paper <http://arxiv.org/abs/1904.07850>,
+  repository <https://github.com/xingyizhou/CenterNet/>.
+task_type: detection
+files:
+  - name: ctdet_coco_dlav0_512.onnx
+    size: 74027755
+    sha256: 3b9acf09b197b3c118715d530f5aef4fa0de739d32a1b9b56b16ebb82f0c82b2
+    source: https://download.01.org/opencv/public_models/122019/ctdet_coco_dlav0/ctdet_coco_dlav0_512.onnx
+model_optimizer_args:
+  - --input_shape=[1,3,512,512]
+  - --input=input.1
+  - --mean_values=input.1[104.04, 113.985, 119.85]
+  - --scale_values=input.1[73.695, 69.87, 70.89]
+  - --output=508,511,514
+  - --input_model=$dl_dir/ctdet_coco_dlav0_512.onnx
+framework: onnx
+license: https://raw.githubusercontent.com/xingyizhou/CenterNet/master/LICENSE
diff --git a/models/public/ctdet_coco_dlav0_512/pytorch-onnx.patch b/models/public/ctdet_coco_dlav0_512/pytorch-onnx.patch
new file mode 100644
index 00000000000..241fbff9ae3
--- /dev/null
+++ b/models/public/ctdet_coco_dlav0_512/pytorch-onnx.patch
@@ -0,0 +1,35 @@
+diff --git a/src/convert.py b/src/convert.py
+new file mode 100644
+index 0000000..16888b6
+--- /dev/null
++++ b/src/convert.py
+@@ -0,0 +1,12 @@
++import torch.onnx
++import onnx
++
++import _init_paths
++from opts import opts
++from detectors.detector_factory import detector_factory
++
++opt = opts().init()
++Detector = detector_factory[opt.task]
++detector = Detector(opt)
++input_shape = [1, 3, opt.input_res, opt.input_res]
++torch.onnx.export(detector.model, torch.randn(input_shape), 'ctdet_coco_dlav0_{}.onnx'.format(opt.input_res), export_params=True)
+diff --git a/src/lib/models/networks/dlav0.py b/src/lib/models/networks/dlav0.py
+index 3ff343c..99e2e88 100644
+--- a/src/lib/models/networks/dlav0.py
++++ b/src/lib/models/networks/dlav0.py
+@@ -602,9 +602,9 @@ class DLASeg(nn.Module):
+         x = self.dla_up(x[self.first_level:])
+         # x = self.fc(x)
+         # y = self.softmax(self.up(x))
+-        ret = {}
+-        for head in self.heads:
+-            ret[head] = self.__getattr__(head)(x)
++        ret = []
++        for head in sorted(self.heads.keys()):
++            ret.append(self.__getattr__(head)(x))
+         return [ret]
+ 
+     '''
diff --git a/models/public/ctpn/ctpn.md b/models/public/ctpn/ctpn.md
index f740da564fa..7ca2e9e9650 100644
--- a/models/public/ctpn/ctpn.md
+++ b/models/public/ctpn/ctpn.md
@@ -13,7 +13,7 @@ Detecting Text in Natural Image with Connectionist Text Proposal Network. For de
 | Type                            | Object detection                          |
 | GFlops                          | 55.813                                    |
 | MParams                         | 17.237                                    |
-| Source framework                | Tensorflow\*                              |
+| Source framework                | TensorFlow\*                              |
 
 ## Performance
 
@@ -80,4 +80,29 @@ Image, name: `Placeholder`, shape: [1x3x600x600], format: [BxCxHxW],
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/eragonruan/text-detection-ctpn/banjin-dev/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/eragonruan/text-detection-ctpn/banjin-dev/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2017 shaohui ruan
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/deeplabv3/deeplabv3.md b/models/public/deeplabv3/deeplabv3.md
index 3dcaeedfe36..00cfc6b84f9 100644
--- a/models/public/deeplabv3/deeplabv3.md
+++ b/models/public/deeplabv3/deeplabv3.md
@@ -13,7 +13,7 @@ DeepLab is a state-of-art deep learning model for semantic image segmentation. F
 | Type              | Semantic segmentation|
 | GFLOPs            | 11.469               |
 | MParams           | 23.819               |
-| Source framework  | Tensorflow\*         |
+| Source framework  | TensorFlow\*         |
 
 ## Accuracy
 
@@ -69,4 +69,6 @@ Integer values in a range [0, 20], which represent an index of a predicted class
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/deeplabv3/model.yml b/models/public/deeplabv3/model.yml
index 8d73bf83709..ad50904a1cc 100644
--- a/models/public/deeplabv3/model.yml
+++ b/models/public/deeplabv3/model.yml
@@ -13,8 +13,8 @@
 # limitations under the License.
 
 description: >-
-  DeepLab is a state-of-art deep learning model for semantic image segmentation.
-  For details see paper <https://arxiv.org/pdf/1706.05587.pdf>
+  DeepLab is a state-of-the-art deep learning model for semantic image segmentation. For
+  details see paper <https://arxiv.org/pdf/1706.05587.pdf>.
 task_type: semantic_segmentation
 files:
   - name: deeplabv3.tar.gz
diff --git a/models/public/densenet-121-caffe2/densenet-121-caffe2.md b/models/public/densenet-121-caffe2/densenet-121-caffe2.md
new file mode 100644
index 00000000000..93e480e3c40
--- /dev/null
+++ b/models/public/densenet-121-caffe2/densenet-121-caffe2.md
@@ -0,0 +1,67 @@
+# densenet-121-caffe2
+
+## Use Case and High-Level Description
+
+This is a Caffe2\* version of `densenet-121` model, one of the DenseNet
+group of models designed to perform image classification. This model
+was converted from Caffe\* to Caffe2\* format. 
+For details see repository <https://github.com/caffe2/models/tree/master/densenet121>,
+paper <https://arxiv.org/pdf/1608.06993.pdf>.
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 5.723         |
+| MParams           | 7.971         |
+| Source framework  | Caffe2\*      |
+
+## Accuracy
+
+## Performance
+
+## Input
+
+### Original model
+
+Image, name - `data`,  shape - `1,3,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`. 
+Mean values - [103.94,116.78,123.68], scale value - 58.8235294.
+
+### Converted model
+
+Image, name - `data`,  shape - `1,3,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+
+## Output
+
+### Original model
+
+Object classifier according to ImageNet classes, name - `fc6`,  shape - `1,1000,1,1`, contains predicted
+probability for each class in logits format.
+
+### Converted model
+
+Object classifier according to ImageNet classes, name - `fc6`,  shape - `1,1000,1,1`, contains predicted
+probability for each class in logits format.
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/caffe2/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0.txt](../licenses/APACHE-2.0.txt).
diff --git a/models/public/densenet-121-caffe2/model.yml b/models/public/densenet-121-caffe2/model.yml
new file mode 100644
index 00000000000..b04d00eafb9
--- /dev/null
+++ b/models/public/densenet-121-caffe2/model.yml
@@ -0,0 +1,44 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  This is a Caffe2* version of "densenet-121" model, one of the DenseNet group of
+  models designed to perform image classification. This model was converted from Caffe*
+  to Caffe2* format. For details see repository <https://github.com/caffe2/models/tree/master/densenet121>,
+  paper <https://arxiv.org/pdf/1608.06993.pdf>.
+task_type: classification
+files:
+  - name: predict_net.pb
+    size: 77239
+    sha256: 820772d4e7b907599cba93ab0e7d2db0dc0b6e313e842a8729a0ea0354e4a719
+    source: https://s3.amazonaws.com/download.caffe2.ai/models/densenet121/predict_net.pb
+  - name: init_net.pb
+    size: 40785727
+    sha256: a3650579bc883a1755750994507c48d84d0f75d193e304eb8caf5031acb5f028
+    source: https://s3.amazonaws.com/download.caffe2.ai/models/densenet121/init_net.pb
+framework: caffe2
+conversion_to_onnx_args:
+  - --model-path=$dl_dir/predict_net.pb
+  - --model-name=densenet-121-caffe2
+  - --weights=$dl_dir/init_net.pb
+  - --input-shape=1,3,224,224
+  - --input-names=data
+  - --output-file=$conv_dir/densenet-121-caffe2.onnx
+model_optimizer_args:
+  - --input_shape=[1,3,224,224]
+  - --input=data
+  - --mean_values=data[103.94,116.78,123.68]
+  - --scale_values=data[58.8235294]
+  - --input_model=$conv_dir/densenet-121-caffe2.onnx
+license: https://raw.githubusercontent.com/caffe2/models/master/LICENSE
diff --git a/models/public/densenet-121-tf/densenet-121-tf.md b/models/public/densenet-121-tf/densenet-121-tf.md
index 149f3da6669..381df0c2846 100644
--- a/models/public/densenet-121-tf/densenet-121-tf.md
+++ b/models/public/densenet-121-tf/densenet-121-tf.md
@@ -2,7 +2,7 @@
 
 ## Use Case and High-Level Description
 
-This is an Tensorflow\* version of `densenet-121` model, one of the DenseNet\*
+This is a TensorFlow\* version of `densenet-121` model, one of the DenseNet\*
 group of models designed to perform image classification. The weights were converted from DenseNet-Keras Models. For details, see [repository](https://github.com/pudae/tensorflow-densenet/) and [paper](https://arxiv.org/pdf/1608.06993.pdf).
 
 ## Example
@@ -57,4 +57,6 @@ Floating point values in a range [0, 1], which represent probabilities for class
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/pudae/tensorflow-densenet/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/pudae/tensorflow-densenet/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TF-DenseNet.txt](../licenses/APACHE-2.0-TF-DenseNet.txt).
diff --git a/models/public/densenet-121-tf/model.yml b/models/public/densenet-121-tf/model.yml
index 0f661025a35..1bcd9ae481e 100644
--- a/models/public/densenet-121-tf/model.yml
+++ b/models/public/densenet-121-tf/model.yml
@@ -13,10 +13,10 @@
 # limitations under the License.
 
 description: >-
-  This is an Tensorflow\* version of `densenet-121` model, one of the DenseNet
-  group of models designed to perform image classification. The weights were converted
-  from DenseNet-Keras Models. For details see repository <https://github.com/pudae/tensorflow-densenet/>,
-  paper <https://arxiv.org/pdf/1608.06993.pdf>
+  This is a TensorFlow* version of "densenet-121" model, one of the DenseNet* group
+  of models designed to perform image classification. The weights were converted from
+  DenseNet-Keras Models. For details, see repository <https://github.com/pudae/tensorflow-densenet/>
+  and paper <https://arxiv.org/pdf/1608.06993.pdf>.
 task_type: classification
 files:
   - name: tf-densenet121.tar.gz
diff --git a/models/public/densenet-121/densenet-121.md b/models/public/densenet-121/densenet-121.md
index 197952abb16..f562648b356 100644
--- a/models/public/densenet-121/densenet-121.md
+++ b/models/public/densenet-121/densenet-121.md
@@ -72,4 +72,35 @@ probability for each class in logits format.
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/liuzhuang13/DenseNet/master/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/liuzhuang13/DenseNet/master/LICENSE):
+
+```
+Copyright (c) 2016, Zhuang Liu.
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without modification,
+are permitted provided that the following conditions are met:
+
+ * Redistributions of source code must retain the above copyright notice, this
+   list of conditions and the following disclaimer.
+
+ * Redistributions in binary form must reproduce the above copyright notice,
+   this list of conditions and the following disclaimer in the documentation
+   and/or other materials provided with the distribution.
+
+ * Neither the name DenseNet nor the names of its contributors may be used to
+   endorse or promote products derived from this software without specific
+   prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
+ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
+WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
+ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
+(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
+LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
+ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/densenet-121/model.yml b/models/public/densenet-121/model.yml
index d839e42091b..f7b5ec974bd 100644
--- a/models/public/densenet-121/model.yml
+++ b/models/public/densenet-121/model.yml
@@ -13,19 +13,11 @@
 # limitations under the License.
 
 description: >-
-  The `densenet-121` model is one of the DenseNet <https://arxiv.org/pdf/1608.06993>
-  group of models designed to perform image classification. Originally trained
-  on Torch, the authors converted them into Caffe\* format. All the DenseNet models
-  have been pretrained on the ImageNet image database. For details about this
+  The "densenet-121" model is one of the DenseNet* <https://arxiv.org/pdf/1608.06993>
+  group of models designed to perform image classification. The authors originally
+  trained the models on Torch*, but then converted them into Caffe* format. All DenseNet
+  models have been pretrained on the ImageNet image database. For details about this
   family of models, check out the repository <https://github.com/shicai/DenseNet-Caffe>.
-
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  BGR order. The BGR mean values need to be subtracted as follows: [103.94, 116.78,
-  123.68] before passing the image blob into the network. In addition, values
-  must be divided by 0.017.
-
-  The model output for `densenet-121` is the typical object classifier output
-  for the 1000 different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: densenet-121.prototxt
diff --git a/models/public/densenet-161-tf/densenet-161-tf.md b/models/public/densenet-161-tf/densenet-161-tf.md
index e760973be33..b78a08ce648 100644
--- a/models/public/densenet-161-tf/densenet-161-tf.md
+++ b/models/public/densenet-161-tf/densenet-161-tf.md
@@ -2,7 +2,7 @@
 
 ## Use Case and High-Level Description
 
-This is an Tensorflow\* version of `densenet-161` model, one of the DenseNet
+This is a TensorFlow\* version of `densenet-161` model, one of the DenseNet
 group of models designed to perform image classification. The weights were converted from DenseNet-Keras Models. For details see [repository](https://github.com/pudae/tensorflow-densenet/), [paper](https://arxiv.org/pdf/1608.06993.pdf).
 
 ## Example
@@ -57,4 +57,6 @@ Floating point values in a range [0, 1], which represent probabilities for class
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/pudae/tensorflow-densenet/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/pudae/tensorflow-densenet/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TF-DenseNet.txt](../licenses/APACHE-2.0-TF-DenseNet.txt).
diff --git a/models/public/densenet-161-tf/model.yml b/models/public/densenet-161-tf/model.yml
index 2bdde5d867a..cbd6f104b9e 100644
--- a/models/public/densenet-161-tf/model.yml
+++ b/models/public/densenet-161-tf/model.yml
@@ -13,10 +13,10 @@
 # limitations under the License.
 
 description: >-
-  This is an Tensorflow\* version of `densenet-161` model, one of the DenseNet
-  group of models designed to perform image classification. The weights were converted
-  from DenseNet-Keras Models. For details see repository <https://github.com/pudae/tensorflow-densenet/>,
-  paper <https://arxiv.org/pdf/1608.06993.pdf>
+  This is a TensorFlow* version of "densenet-161" model, one of the DenseNet group
+  of models designed to perform image classification. The weights were converted from
+  DenseNet-Keras Models. For details see repository <https://github.com/pudae/tensorflow-densenet/>,
+  paper <https://arxiv.org/pdf/1608.06993.pdf>.
 task_type: classification
 files:
   - name: tf-densenet161.tar.gz
diff --git a/models/public/densenet-161/densenet-161.md b/models/public/densenet-161/densenet-161.md
index da2fa26a589..4f510740b75 100644
--- a/models/public/densenet-161/densenet-161.md
+++ b/models/public/densenet-161/densenet-161.md
@@ -74,4 +74,35 @@ probability for each class in logits format
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/liuzhuang13/DenseNet/master/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/liuzhuang13/DenseNet/master/LICENSE):
+
+```
+Copyright (c) 2016, Zhuang Liu.
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without modification,
+are permitted provided that the following conditions are met:
+
+ * Redistributions of source code must retain the above copyright notice, this
+   list of conditions and the following disclaimer.
+
+ * Redistributions in binary form must reproduce the above copyright notice,
+   this list of conditions and the following disclaimer in the documentation
+   and/or other materials provided with the distribution.
+
+ * Neither the name DenseNet nor the names of its contributors may be used to
+   endorse or promote products derived from this software without specific
+   prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
+ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
+WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
+ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
+(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
+LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
+ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/densenet-161/model.yml b/models/public/densenet-161/model.yml
index c12e36f7a6d..93d715f7d0d 100644
--- a/models/public/densenet-161/model.yml
+++ b/models/public/densenet-161/model.yml
@@ -13,21 +13,21 @@
 # limitations under the License.
 
 description: >-
-  The `densenet-161` model is one of the DenseNet <https://arxiv.org/pdf/1608.06993>
-  group of models designed to perform image classification. The main difference
-  with the `densenet-121` model is the size and accuracy of the model. The `densenet-161`
-  is much larger at 100MB in size vs the `densenet-121` model's roughly 31MB size.
-  Originally trained on Torch, the authors converted them into Caffe* format.
-  All the DenseNet models have been pretrained on the ImageNet image database.
-  For details about this family of models, check out the repository <https://github.com/shicai/DenseNet-Caffe>.
+  The "densenet-161" model is one of the DenseNet <https://arxiv.org/pdf/1608.06993>
+  group of models designed to perform image classification. The main difference with
+  the "densenet-121" model is the size and accuracy of the model. The "densenet-161"
+  is much larger at 100MB in size vs the "densenet-121" model's roughly 31MB size.
+  Originally trained on Torch, the authors converted them into Caffe* format. All
+  the DenseNet models have been pretrained on the ImageNet image database. For details
+  about this family of models, check out the repository <https://github.com/shicai/DenseNet-Caffe>.
 
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  BGR order. The BGR mean values need to be subtracted as follows: [103.94, 116.78,
-  123.68] before passing the image blob into the network. In addition, values
-  must be divided by 0.017.
+  The model input is a blob that consists of a single image of 1x3x224x224 in BGR
+  order. The BGR mean values need to be subtracted as follows: [103.94, 116.78, 123.68]
+  before passing the image blob into the network. In addition, values must be divided
+  by 0.017.
 
-  The model output for `densenet-161` is the typical object classifier output
-  for the 1000 different classifications matching those in the ImageNet database.
+  The model output for "densenet-161" is the typical object classifier output for
+  the 1000 different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: densenet-161.prototxt
diff --git a/models/public/densenet-169-tf/densenet-169-tf.md b/models/public/densenet-169-tf/densenet-169-tf.md
index db80857209b..59fcffb0f66 100644
--- a/models/public/densenet-169-tf/densenet-169-tf.md
+++ b/models/public/densenet-169-tf/densenet-169-tf.md
@@ -2,7 +2,7 @@
 
 ## Use Case and High-Level Description
 
-This is an Tensorflow\* version of `densenet-169` model, one of the DenseNet
+This is a TensorFlow\* version of `densenet-169` model, one of the DenseNet
 group of models designed to perform image classification. The weights were converted from DenseNet-Keras Models. For details, see [repository](https://github.com/pudae/tensorflow-densenet/) and [paper](https://arxiv.org/pdf/1608.06993.pdf).
 
 ## Example
@@ -56,4 +56,6 @@ Name:`densenet169/predictions/Reshape_1`. Contains floating point values in a ra
 Name: `densenet169/predictions/Reshape_1/Transpose`, shape: [1, 1, 1, 1000]. Contains floating point values in a range [0, 1], which represent probabilities for classes in a dataset.
 
 ## Legal Information
-[https://raw.githubusercontent.com/pudae/tensorflow-densenet/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/pudae/tensorflow-densenet/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TF-DenseNet.txt](../licenses/APACHE-2.0-TF-DenseNet.txt).
diff --git a/models/public/densenet-169-tf/model.yml b/models/public/densenet-169-tf/model.yml
index e9c2c6a5c69..3061073411a 100644
--- a/models/public/densenet-169-tf/model.yml
+++ b/models/public/densenet-169-tf/model.yml
@@ -13,10 +13,10 @@
 # limitations under the License.
 
 description: >-
-  This is an Tensorflow\* version of `densenet-169` model, one of the DenseNet
-  group of models designed to perform image classification. The weights were converted
-  from DenseNet-Keras Models. For details see repository <https://github.com/pudae/tensorflow-densenet/>,
-  paper <https://arxiv.org/pdf/1608.06993.pdf>
+  This is a TensorFlow* version of "densenet-169" model, one of the DenseNet group
+  of models designed to perform image classification. The weights were converted from
+  DenseNet-Keras Models. For details, see repository <https://github.com/pudae/tensorflow-densenet/>
+  and paper <https://arxiv.org/pdf/1608.06993.pdf>.
 task_type: classification
 files:
   - name: tf-densenet169.tar.gz
diff --git a/models/public/densenet-169/densenet-169.md b/models/public/densenet-169/densenet-169.md
index fea0e44512b..ee616e2af4c 100644
--- a/models/public/densenet-169/densenet-169.md
+++ b/models/public/densenet-169/densenet-169.md
@@ -72,6 +72,37 @@ probability for each class in logits format
 Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000,1,1`, contains predicted
 probability for each class in logits format
 
-## License
-
-[https://raw.githubusercontent.com/liuzhuang13/DenseNet/master/LICENSE]()
+## Legal Information
+
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/liuzhuang13/DenseNet/master/LICENSE):
+
+```
+Copyright (c) 2016, Zhuang Liu.
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without modification,
+are permitted provided that the following conditions are met:
+
+ * Redistributions of source code must retain the above copyright notice, this
+   list of conditions and the following disclaimer.
+
+ * Redistributions in binary form must reproduce the above copyright notice,
+   this list of conditions and the following disclaimer in the documentation
+   and/or other materials provided with the distribution.
+
+ * Neither the name DenseNet nor the names of its contributors may be used to
+   endorse or promote products derived from this software without specific
+   prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
+ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
+WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
+ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
+(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
+LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
+ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/densenet-169/model.yml b/models/public/densenet-169/model.yml
index eab1383f807..c272b227c76 100644
--- a/models/public/densenet-169/model.yml
+++ b/models/public/densenet-169/model.yml
@@ -13,21 +13,21 @@
 # limitations under the License.
 
 description: >-
-  The `densenet-169` model is one of the DenseNet <https://arxiv.org/pdf/1608.06993>
-  group of models designed to perform image classification. The main difference
-  with the `densenet-121` model is the size and accuracy of the model. The `densenet-169`
-  is larger at just about 55MB in size vs the `densenet-121` model's roughly 31MB
+  The "densenet-169" model is one of the DenseNet <https://arxiv.org/pdf/1608.06993>
+  group of models designed to perform image classification. The main difference with
+  the "densenet-121" model is the size and accuracy of the model. The "densenet-169"
+  is larger at just about 55MB in size vs the "densenet-121" model's roughly 31MB
   size. Originally trained on Torch, the authors converted them into Caffe* format.
-  All the DenseNet models have been pretrained on the ImageNet image database.
-  For details about this family of models, check out the repository <https://github.com/shicai/DenseNet-Caffe>.
+  All the DenseNet models have been pretrained on the ImageNet image database. For
+  details about this family of models, check out the repository <https://github.com/shicai/DenseNet-Caffe>.
 
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  BGR order. The BGR mean values need to be subtracted as follows: [103.94, 116.78,
-  123.68] before passing the image blob into the network. In addition, values
-  must be divided by 0.017.
+  The model input is a blob that consists of a single image of 1x3x224x224 in BGR
+  order. The BGR mean values need to be subtracted as follows: [103.94, 116.78, 123.68]
+  before passing the image blob into the network. In addition, values must be divided
+  by 0.017.
 
-  The model output for `densenet-169` is the typical object classifier output
-  for the 1000 different classifications matching those in the ImageNet database.
+  The model output for "densenet-169" is the typical object classifier output for
+  the 1000 different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: densenet-169.prototxt
diff --git a/models/public/densenet-201/densenet-201.md b/models/public/densenet-201/densenet-201.md
index a9770339498..4e912622848 100644
--- a/models/public/densenet-201/densenet-201.md
+++ b/models/public/densenet-201/densenet-201.md
@@ -74,4 +74,35 @@ probability for each class in logits format
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/liuzhuang13/DenseNet/master/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/liuzhuang13/DenseNet/master/LICENSE):
+
+```
+Copyright (c) 2016, Zhuang Liu.
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without modification,
+are permitted provided that the following conditions are met:
+
+ * Redistributions of source code must retain the above copyright notice, this
+   list of conditions and the following disclaimer.
+
+ * Redistributions in binary form must reproduce the above copyright notice,
+   this list of conditions and the following disclaimer in the documentation
+   and/or other materials provided with the distribution.
+
+ * Neither the name DenseNet nor the names of its contributors may be used to
+   endorse or promote products derived from this software without specific
+   prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
+ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
+WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
+ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
+(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
+LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
+ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/densenet-201/model.yml b/models/public/densenet-201/model.yml
index 120b29e1244..d3a4828d220 100644
--- a/models/public/densenet-201/model.yml
+++ b/models/public/densenet-201/model.yml
@@ -13,21 +13,21 @@
 # limitations under the License.
 
 description: >-
-  The `densenet-201` model is also one of the DenseNet <https://arxiv.org/pdf/1608.06993>
-  group of models designed to perform image classification. The main difference
-  with the `densenet-121` model is the size and accuracy of the model. The `densenet-201`
-  is larger at over 77MB in size vs the `densenet-121` model's roughly 31MB size.
-  Originally trained on Torch, the authors converted them into Caffe\* format.
-  All the DenseNet models have been pretrained on the ImageNet image database.
-  For details about this family of models, check out the repository <https://github.com/shicai/DenseNet-Caffe>.
+  The "densenet-201" model is also one of the DenseNet <https://arxiv.org/pdf/1608.06993>
+  group of models designed to perform image classification. The main difference with
+  the "densenet-121" model is the size and accuracy of the model. The "densenet-201"
+  is larger at over 77MB in size vs the "densenet-121" model's roughly 31MB size.
+  Originally trained on Torch, the authors converted them into Caffe* format. All
+  the DenseNet models have been pretrained on the ImageNet image database. For details
+  about this family of models, check out the repository <https://github.com/shicai/DenseNet-Caffe>.
 
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  BGR order. The BGR mean values need to be subtracted as follows: [103.94, 116.78,
-  123.68] before passing the image blob into the network. In addition, values
-  must be divided by 0.017.
+  The model input is a blob that consists of a single image of 1x3x224x224 in BGR
+  order. The BGR mean values need to be subtracted as follows: [103.94, 116.78, 123.68]
+  before passing the image blob into the network. In addition, values must be divided
+  by 0.017.
 
-  The model output for `densenet-201` is the typical object classifier output
-  for the 1000 different classifications matching those in the ImageNet database.
+  The model output for "densenet-201" is the typical object classifier output for
+  the 1000 different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: densenet-201.prototxt
diff --git a/models/public/efficientnet-b0-pytorch/efficientnet-b0-pytorch.md b/models/public/efficientnet-b0-pytorch/efficientnet-b0-pytorch.md
new file mode 100644
index 00000000000..e37253dc37e
--- /dev/null
+++ b/models/public/efficientnet-b0-pytorch/efficientnet-b0-pytorch.md
@@ -0,0 +1,80 @@
+# efficientnet-b0-pytorch
+
+## Use Case and High-Level Description
+
+The `efficientnet-b0-pytorch` model is one of the [EfficientNet](https://arxiv.org/abs/1905.11946) models designed to perform image classification. This model was pretrained in PyTorch\*. All the EfficientNet models have been pretrained on the ImageNet image database. For details about this family of models, check out the [EfficientNets for PyTorch repository](https://github.com/rwightman/gen-efficientnet-pytorch).
+
+The model input is a blob that consists of a single image with the [3x224x224] shape in the RGB
+order. Before passing the image blob to the network, do the following:
+1. Subtract the RGB mean values as follows: [123.675,116.28,103.53]
+2. Divide the result by the RGB scale values as follows: [58.395,57.12,57.375]
+
+The model output for `efficientnet-b0-pytorch` is the typical object classifier output for
+1000 different classifications matching those in the ImageNet database.
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 0.819         |
+| MParams           | 5.268         |
+| Source framework  | PyTorch\*     |
+
+## Accuracy
+
+| Metric | Original model | Converted model |
+| ------ | -------------- | --------------- |
+| Top 1  | 76.91          | 76.91           |
+| Top 5  | 93.21          | 93.21           | 
+
+## Performance
+
+## Input
+
+### Original Model
+
+Image, name - `data`,  shape - `1,3,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `RGB`.
+Mean values - [123.675,116.28,103.53], scale values - [58.395,57.12,57.375].
+
+### Converted Model
+
+Image, name - `data`,  shape - `1,3,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+
+## Output
+
+### Original Model
+
+Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+### Converted Model
+
+Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/5e91628ed98250989a7ddd20abfe27385e0493c1/LICENSE).
+A copy of the license is provided in [APACHE-2.0-PyTorch-EfficientNet.txt](../licenses/APACHE-2.0-PyTorch-EfficientNet.txt).
diff --git a/models/public/efficientnet-b0-pytorch/model.yml b/models/public/efficientnet-b0-pytorch/model.yml
new file mode 100644
index 00000000000..d5cf5b0955a
--- /dev/null
+++ b/models/public/efficientnet-b0-pytorch/model.yml
@@ -0,0 +1,73 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  The "efficientnet-b0-pytorch" model is one of the EfficientNet <https://arxiv.org/abs/1905.11946>
+  models designed to perform image classification. This model was pretrained in PyTorch*.
+  All the EfficientNet models have been pretrained on the ImageNet image database.
+  For details about this family of models, check out the EfficientNets for PyTorch
+  repository <https://github.com/rwightman/gen-efficientnet-pytorch>.
+
+  The model input is a blob that consists of a single image with the [3x224x224] shape
+  in the RGB order. Before passing the image blob to the network, do the following:
+  1. Subtract the RGB mean values as follows: [123.675,116.28,103.53] 2. Divide the
+  result by the RGB scale values as follows: [58.395,57.12,57.375]
+
+  The model output for "efficientnet-b0-pytorch" is the typical object classifier
+  output for 1000 different classifications matching those in the ImageNet database.
+task_type: classification
+files:
+  - name: model/gen_efficientnet.py
+    size: 40997
+    sha256: 8613d48ca74611d3566d8c02cbf7c92aad6b16a708ffcf21183a7014fecdec09
+    source: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/gen_efficientnet.py
+  - name: model/efficientnet_builder.py
+    size: 18446
+    sha256: 69bb2adc49dc79c8860f36acca910bad6733e23b46ed80551248b90141d5e1b5
+    source: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/efficientnet_builder.py
+  - name: model/helpers.py
+    size: 1097
+    sha256: 0415f198b8a87cb34c9f9aed79f267043010fbd197e27df805bab9d070da82ed
+    source: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/helpers.py
+  - name: model/conv2d_helpers.py
+    size: 6175
+    sha256: e6ba7e878dd28c6d0ccc9707205bf6b58bea664d7fee820d7101a6a8e48990a9
+    source: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/conv2d_helpers.py
+  - name: model/__init__.py
+    size: 32
+    sha256: e0bedda5f5e949b8ace7d4f5cdf80e7e664c0b0a935486b6152078fa61c80c1b
+    source: https://github.com/rwightman/gen-efficientnet-pytorch/raw/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/__init__.py
+  - name: efficientnet-b0.pth
+    size: 21376958
+    sha256: d6904d92f92ccdca67c9717f9d119392d658577f99e5ce021b57d157985783db
+    source: https://github.com/rwightman/pytorch-image-models/releases/download/v0.1-weights/efficientnet_b0-d6904d92.pth
+conversion_to_onnx_args:
+  - --model-path=$dl_dir
+  - --model-name=efficientnet_b0
+  - --import-module=model
+  - --weights=$dl_dir/efficientnet-b0.pth
+  - --input-shape=1,3,224,224
+  - --input-names=data
+  - --output-names=prob
+  - --output-file=$conv_dir/efficientnet-b0.onnx
+model_optimizer_args:
+  - --reverse_input_channels
+  - --input_shape=[1,3,224,224]
+  - --input=data
+  - --mean_values=data[123.675,116.28,103.53]
+  - --scale_values=data[58.395,57.12,57.375]
+  - --output=prob
+  - --input_model=$conv_dir/efficientnet-b0.onnx
+framework: pytorch
+license: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/LICENSE
diff --git a/models/public/efficientnet-b0/efficientnet-b0.md b/models/public/efficientnet-b0/efficientnet-b0.md
new file mode 100644
index 00000000000..99f62454f12
--- /dev/null
+++ b/models/public/efficientnet-b0/efficientnet-b0.md
@@ -0,0 +1,75 @@
+# efficientnet-b0
+
+## Use Case and High-Level Description
+
+The `efficientnet-b0` model is one of the [EfficientNet](https://arxiv.org/abs/1905.11946) models
+designed to perform image classification.
+This model was pretrained in TensorFlow\*.
+All the EfficientNet models have been pretrained on the ImageNet\* image database.
+For details about this family of models, check out the [TensorFlow Cloud TPU repository](https://github.com/tensorflow/tpu/tree/master/models/official/efficientnet).
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 0.819         |
+| MParams           | 5.268         |
+| Source framework  | TensorFlow\*  |
+
+## Accuracy
+
+| Metric | Original model | Converted model |
+| ------ | -------------- | --------------- |
+| Top 1  | 75.70          | 75.70           |
+| Top 5  | 92.76          | 92.76           | 
+
+## Performance
+
+## Input
+
+### Original Model
+
+Image, name - `image`,  shape - `[1x224x224x3]`, format is `[BxHxWxC]` where:
+
+- `B` - batch size
+- `H` - height
+- `W` - width
+- `C` - channel
+
+Channel order is `RGB`.
+
+### Converted Model
+
+Image, name - `sub/placeholder_port_0`,  shape - `[1x224x224x3]`, format is `[BxHxWxC]` where:
+
+- `B` - batch size
+- `H` - height
+- `W` - width
+- `C` - channel
+
+Channel order is `BGR`.
+
+## Output
+
+### Original Model
+
+Object classifier according to ImageNet classes, name - `logits`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in logits format
+
+### Converted Model
+
+Object classifier according to ImageNet classes, name - `efficientnet-b0/model/head/dense/MatMul`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in logits format
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/tpu/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TF-TPU.txt](../licenses/APACHE-2.0-TF-TPU.txt).
diff --git a/models/public/efficientnet-b0/model.yml b/models/public/efficientnet-b0/model.yml
new file mode 100644
index 00000000000..ef0cd62ca38
--- /dev/null
+++ b/models/public/efficientnet-b0/model.yml
@@ -0,0 +1,38 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  The "efficientnet-b0" model is one of the EfficientNet <https://arxiv.org/abs/1905.11946>
+  models designed to perform image classification. This model was pretrained in TensorFlow*.
+  All the EfficientNet models have been pretrained on the ImageNet* image database.
+  For details about this family of models, check out the TensorFlow Cloud TPU repository
+  <https://github.com/tensorflow/tpu/tree/master/models/official/efficientnet>.
+task_type: classification
+files:
+  - name: efficientnet-b0.tar.gz
+    size: 47390720
+    sha256: b82d670255bd48b0a122d571e5766091048a503209caf15e2cda58a41118c613
+    source: https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/ckpts/efficientnet-b0.tar.gz
+postprocessing:
+  - $type: unpack_archive
+    format: gztar
+    file: efficientnet-b0.tar.gz
+model_optimizer_args:
+  - --input_shape=[1,224,224,3]
+  - --input=0:sub
+  - --output=logits
+  - --input_meta_graph=$dl_dir/efficientnet-b0/model.ckpt.meta
+  - --reverse_input_channels
+framework: tf
+license: https://raw.githubusercontent.com/tensorflow/tpu/master/LICENSE
diff --git a/models/public/efficientnet-b0_auto_aug/efficientnet-b0_auto_aug.md b/models/public/efficientnet-b0_auto_aug/efficientnet-b0_auto_aug.md
new file mode 100644
index 00000000000..91fd249aa34
--- /dev/null
+++ b/models/public/efficientnet-b0_auto_aug/efficientnet-b0_auto_aug.md
@@ -0,0 +1,76 @@
+# efficientnet-b0_auto_aug
+
+## Use Case and High-Level Description
+
+The `efficientnet-b0_auto_aug` model is one of the [EfficientNet](https://arxiv.org/abs/1905.11946)
+models designed to perform image classification, trained with
+[AutoAugmentation preprocessing](https://arxiv.org/abs/1805.09501).
+This model was pretrained in TensorFlow\*.
+All the EfficientNet models have been pretrained on the ImageNet\* image database.
+For details about this family of models, check out the [TensorFlow Cloud TPU repository](https://github.com/tensorflow/tpu/tree/master/models/official/efficientnet).
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 0.819         |
+| MParams           | 5.268         |
+| Source framework  | TensorFlow\*  |
+
+## Accuracy
+
+| Metric | Original model | Converted model |
+| ------ | -------------- | --------------- |
+| Top 1  | 76.43          | 76.43           |
+| Top 5  | 93.04          | 93.04           | 
+
+## Performance
+
+## Input
+
+### Original Model
+
+Image, name - `image`,  shape - `[1x224x224x3]`, format is `[BxHxWxC]` where:
+
+- `B` - batch size
+- `H` - height
+- `W` - width
+- `C` - channel
+
+Channel order is `RGB`.
+
+### Converted Model
+
+Image, name - `sub/placeholder_port_0`,  shape - `[1x224x224x3]`, format is `[BxHxWxC]` where:
+
+- `B` - batch size
+- `H` - height
+- `W` - width
+- `C` - channel
+
+Channel order is `BGR`.
+
+## Output
+
+### Original Model
+
+Object classifier according to ImageNet classes, name - `logits`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in logits format
+
+### Converted Model
+
+Object classifier according to ImageNet classes, name - `efficientnet-b0/model/head/dense/MatMul`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in logits format
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/tpu/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TF-TPU.txt](../licenses/APACHE-2.0-TF-TPU.txt).
diff --git a/models/public/efficientnet-b0_auto_aug/model.yml b/models/public/efficientnet-b0_auto_aug/model.yml
new file mode 100644
index 00000000000..dd7f43e8fe8
--- /dev/null
+++ b/models/public/efficientnet-b0_auto_aug/model.yml
@@ -0,0 +1,39 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  The "efficientnet-b0_auto_aug" model is one of the EfficientNet <https://arxiv.org/abs/1905.11946>
+  models designed to perform image classification, trained with AutoAugmentation preprocessing
+  <https://arxiv.org/abs/1805.09501>. This model was pretrained in TensorFlow*. All
+  the EfficientNet models have been pretrained on the ImageNet* image database. For
+  details about this family of models, check out the TensorFlow Cloud TPU repository
+  <https://github.com/tensorflow/tpu/tree/master/models/official/efficientnet>.
+task_type: classification
+files:
+  - name: efficientnet-b0.tar.gz
+    size: 39302973
+    sha256: c1109c4842c2294d9df2de9fcebc28692d1fe48ff4447e265a5d8e2f74e0fe65
+    source: https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/ckptsaug/efficientnet-b0.tar.gz
+postprocessing:
+  - $type: unpack_archive
+    format: gztar
+    file: efficientnet-b0.tar.gz
+model_optimizer_args:
+  - --input_shape=[1,224,224,3]
+  - --input=0:sub
+  - --output=logits
+  - --input_meta_graph=$dl_dir/efficientnet-b0/model.ckpt.meta
+  - --reverse_input_channels
+framework: tf
+license: https://raw.githubusercontent.com/tensorflow/tpu/master/LICENSE
diff --git a/models/public/efficientnet-b5-pytorch/efficientnet-b5-pytorch.md b/models/public/efficientnet-b5-pytorch/efficientnet-b5-pytorch.md
new file mode 100644
index 00000000000..20d6dbe8f61
--- /dev/null
+++ b/models/public/efficientnet-b5-pytorch/efficientnet-b5-pytorch.md
@@ -0,0 +1,82 @@
+# efficientnet-b5-pytorch
+
+## Use Case and High-Level Description
+
+The `efficientnet-b5-pytorch` model is one of the [EfficientNet](https://arxiv.org/abs/1905.11946)
+models designed to perform image classification. This model was pretrained in TensorFlow\*, then weights were converted to PyTorch\*. All the EfficientNet models have been pretrained on the ImageNet\* image database. For details about this family of models, check out the [EfficientNets for PyTorch repository](https://github.com/rwightman/gen-efficientnet-pytorch).
+
+
+The model input is a blob that consists of a single image with the [3x456x456] shape in the RGB
+order. Before passing the image blob to the network, do the following:
+1. Subtract the RGB mean values as follows: [123.675,116.28,103.53]
+2. Divide the result by the RGB scale values: [58.395,57.12,57.375]
+
+The model output for `efficientnet-b5-pytorch` is the typical object classifier output for
+the 1000 different classifications matching those in the ImageNet database.
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 21.252        |
+| MParams           | 30.303        |
+| Source framework  | PyTorch\*     |
+
+## Accuracy
+
+| Metric | Original model | Converted model |
+| ------ | -------------- | --------------- |
+| Top 1  | 83.69          | 83.69           |
+| Top 5  | 96.71          | 96.71           | 
+
+## Performance
+
+## Input
+
+### Original Model
+
+Image, name - `data`,  shape - `1,3,456,456`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `RGB`.
+Mean values - [123.675,116.28,103.53], scale values - [58.395,57.12,57.375].
+
+### Converted Model
+
+Image, name - `data`,  shape - `1,3,456,456`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+
+## Output
+
+### Original Model
+
+Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+### Converted Model
+
+Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/5e91628ed98250989a7ddd20abfe27385e0493c1/LICENSE).
+A copy of the license is provided in [APACHE-2.0-PyTorch-EfficientNet.txt](../licenses/APACHE-2.0-PyTorch-EfficientNet.txt).
diff --git a/models/public/efficientnet-b5-pytorch/model.yml b/models/public/efficientnet-b5-pytorch/model.yml
new file mode 100644
index 00000000000..3d70293ef33
--- /dev/null
+++ b/models/public/efficientnet-b5-pytorch/model.yml
@@ -0,0 +1,79 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  The "efficientnet-b5-pytorch" model is one of the EfficientNet <https://arxiv.org/abs/1905.11946>
+  models designed to perform image classification. This model was pretrained in TensorFlow*,
+  then weights were converted to PyTorch*. All the EfficientNet models have been pretrained
+  on the ImageNet* image database. For details about this family of models, check
+  out the EfficientNets for PyTorch repository <https://github.com/rwightman/gen-efficientnet-pytorch>.
+
+
+  The model input is a blob that consists of a single image with the [3x456x456] shape
+  in the RGB order. Before passing the image blob to the network, do the following:
+  1. Subtract the RGB mean values as follows: [123.675,116.28,103.53] 2. Divide the
+  result by the RGB scale values: [58.395,57.12,57.375]
+
+  The model output for "efficientnet-b5-pytorch" is the typical object classifier
+  output for the 1000 different classifications matching those in the ImageNet database.
+task_type: classification
+files:
+  - name: model/gen_efficientnet.py
+    size: 40997
+    sha256: 8613d48ca74611d3566d8c02cbf7c92aad6b16a708ffcf21183a7014fecdec09
+    source: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/gen_efficientnet.py
+  - name: model/efficientnet_builder.py
+    size: 18446
+    sha256: 69bb2adc49dc79c8860f36acca910bad6733e23b46ed80551248b90141d5e1b5
+    source: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/efficientnet_builder.py
+  - name: model/helpers.py
+    size: 1097
+    sha256: 0415f198b8a87cb34c9f9aed79f267043010fbd197e27df805bab9d070da82ed
+    source: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/helpers.py
+  - name: model/conv2d_helpers.py
+    size: 6175
+    sha256: e6ba7e878dd28c6d0ccc9707205bf6b58bea664d7fee820d7101a6a8e48990a9
+    source: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/conv2d_helpers.py
+  - name: model/__init__.py
+    size: 32
+    sha256: e0bedda5f5e949b8ace7d4f5cdf80e7e664c0b0a935486b6152078fa61c80c1b
+    source: https://github.com/rwightman/gen-efficientnet-pytorch/raw/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/__init__.py
+  - name: tf-efficientnet-b5.pth
+    size: 122398414
+    sha256: 99018a74e61e5948a955ebfaa2b02ba9abe7bb2e6b7f3d2dfe100e07e103bbdb
+    source: https://github.com/rwightman/pytorch-image-models/releases/download/v0.1-weights/tf_efficientnet_b5_aa-99018a74.pth
+postprocessing:
+  - $type: regex_replace
+    file: model/conv2d_helpers.py
+    pattern: '_EXPORTABLE = False'
+    replacement: '_EXPORTABLE = True'
+conversion_to_onnx_args:
+  - --model-path=$dl_dir
+  - --model-name=tf_efficientnet_b5
+  - --import-module=model
+  - --weights=$dl_dir/tf-efficientnet-b5.pth
+  - --input-shape=1,3,456,456
+  - --input-names=data
+  - --output-names=prob
+  - --output-file=$conv_dir/efficientnet-b5.onnx
+model_optimizer_args:
+  - --reverse_input_channels
+  - --input_shape=[1,3,456,456]
+  - --input=data
+  - --mean_values=data[123.675,116.28,103.53]
+  - --scale_values=data[58.395,57.12,57.375]
+  - --output=prob
+  - --input_model=$conv_dir/efficientnet-b5.onnx
+framework: pytorch
+license: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/LICENSE
diff --git a/models/public/efficientnet-b5/efficientnet-b5.md b/models/public/efficientnet-b5/efficientnet-b5.md
new file mode 100644
index 00000000000..808dd67dae9
--- /dev/null
+++ b/models/public/efficientnet-b5/efficientnet-b5.md
@@ -0,0 +1,75 @@
+# efficientnet-b5
+
+## Use Case and High-Level Description
+
+The `efficientnet-b5` model is one of the [EfficientNet](https://arxiv.org/abs/1905.11946) 
+models designed to perform image classification.
+This model was pretrained in TensorFlow\*.
+All the EfficientNet models have been pretrained on the ImageNet\* image database.
+For details about this family of models, check out the [TensorFlow Cloud TPU repository](https://github.com/tensorflow/tpu/tree/master/models/official/efficientnet).
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 21.252        |
+| MParams           | 30.303        |
+| Source framework  | TensorFlow\*  |
+
+## Accuracy
+
+| Metric | Original model | Converted model |
+| ------ | -------------- | --------------- |
+| Top 1  | 83.33          | 83.33           |
+| Top 5  | 96.67          | 96.67           |
+
+## Performance
+
+## Input
+
+### Original Model
+
+Image, name - `image`,  shape - `[1x456x456x3]`, format is `[BxHxWxC]` where:
+
+- `B` - batch size
+- `H` - height
+- `W` - width
+- `C` - channel
+
+Channel order is `RGB`.
+
+### Converted Model
+
+Image, name - `sub/placeholder_port_0`,  shape - `[1x456x456x3]`, format is `[BxHxWxC]` where:
+
+- `B` - batch size
+- `H` - height
+- `W` - width
+- `C` - channel
+
+Channel order is `BGR`.
+
+## Output
+
+### Original Model
+
+Object classifier according to ImageNet classes, name - `logits`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+### Converted Model
+
+Object classifier according to ImageNet classes, name - `efficientnet-b5/model/head/dense/MatMul`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/tpu/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TF-TPU.txt](../licenses/APACHE-2.0-TF-TPU.txt).
diff --git a/models/public/efficientnet-b5/model.yml b/models/public/efficientnet-b5/model.yml
new file mode 100644
index 00000000000..caa133ee0c5
--- /dev/null
+++ b/models/public/efficientnet-b5/model.yml
@@ -0,0 +1,38 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  The "efficientnet-b5" model is one of the EfficientNet <https://arxiv.org/abs/1905.11946>  models
+  designed to perform image classification. This model was pretrained in TensorFlow*.
+  All the EfficientNet models have been pretrained on the ImageNet* image database.
+  For details about this family of models, check out the TensorFlow Cloud TPU repository
+  <https://github.com/tensorflow/tpu/tree/master/models/official/efficientnet>.
+task_type: classification
+files:
+  - name: efficientnet-b5.tar.gz
+    size: 255918080
+    sha256: 088c222266c64608da87d8730b3f5bf22da7677fd128357d8040a0389aab338e
+    source: https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/ckpts/efficientnet-b5.tar.gz
+postprocessing:
+  - $type: unpack_archive
+    format: gztar
+    file: efficientnet-b5.tar.gz
+model_optimizer_args:
+  - --input_shape=[1,456,456,3]
+  - --input=0:sub
+  - --output=logits
+  - --input_meta_graph=$dl_dir/efficientnet-b5/model.ckpt.meta
+  - --reverse_input_channels
+framework: tf
+license: https://raw.githubusercontent.com/tensorflow/tpu/master/LICENSE
diff --git a/models/public/efficientnet-b7-pytorch/efficientnet-b7-pytorch.md b/models/public/efficientnet-b7-pytorch/efficientnet-b7-pytorch.md
new file mode 100644
index 00000000000..6abbc4453e7
--- /dev/null
+++ b/models/public/efficientnet-b7-pytorch/efficientnet-b7-pytorch.md
@@ -0,0 +1,81 @@
+# efficientnet-b7-pytorch
+
+## Use Case and High-Level Description
+
+The `efficientnet-b7-pytorch` model is one of the [EfficientNet](https://arxiv.org/abs/1905.11946) 
+models designed to perform image classification. This model was pretrained in TensorFlow\*, then weights were converted to PyTorch\*. All the EfficientNet models have been pretrained on the ImageNet\* image database. For details about this family of models, check out the [EfficientNets for PyTorch repository](https://github.com/rwightman/gen-efficientnet-pytorch).
+
+The model input is a blob that consists of a single image with the [3x600x600] shape in the RGB
+order. Before passing the image blob to the network, do the following:
+1. Subtract the RGB mean values as follows: [123.675,116.28,103.53]
+2. Divide the result by the RGB scale values: [58.395,57.12,57.375]
+
+The model output for `efficientnet-b7-pytorch` is the typical object classifier output for
+the 1000 different classifications matching those in the ImageNet database.
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 77.618        |
+| MParams           | 66.193        |
+| Source framework  | PyTorch\*     |
+
+## Accuracy
+
+| Metric | Original model | Converted model |
+| ------ | -------------- | --------------- |
+| Top 1  | 84.42          | 84.42           |
+| Top 5  | 96.91          | 96.91           |
+
+## Performance
+
+## Input
+
+### Original Model
+
+Image, name - `data`,  shape - `1,3,600,600`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `RGB`.
+Mean values - [123.675,116.28,103.53], scale values - [58.395,57.12,57.375].
+
+### Converted Model
+
+Image, name - `data`,  shape - `1,3,600,600`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+
+## Output
+
+### Original Model
+
+Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+### Converted Model
+
+Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/5e91628ed98250989a7ddd20abfe27385e0493c1/LICENSE).
+A copy of the license is provided in [APACHE-2.0-PyTorch-EfficientNet.txt](../licenses/APACHE-2.0-PyTorch-EfficientNet.txt).
diff --git a/models/public/efficientnet-b7-pytorch/model.yml b/models/public/efficientnet-b7-pytorch/model.yml
new file mode 100644
index 00000000000..271647e395a
--- /dev/null
+++ b/models/public/efficientnet-b7-pytorch/model.yml
@@ -0,0 +1,78 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  The "efficientnet-b7-pytorch" model is one of the EfficientNet <https://arxiv.org/abs/1905.11946>  models
+  designed to perform image classification. This model was pretrained in TensorFlow*,
+  then weights were converted to PyTorch*. All the EfficientNet models have been pretrained
+  on the ImageNet* image database. For details about this family of models, check
+  out the EfficientNets for PyTorch repository <https://github.com/rwightman/gen-efficientnet-pytorch>.
+
+  The model input is a blob that consists of a single image with the [3x600x600] shape
+  in the RGB order. Before passing the image blob to the network, do the following:
+  1. Subtract the RGB mean values as follows: [123.675,116.28,103.53] 2. Divide the
+  result by the RGB scale values: [58.395,57.12,57.375]
+
+  The model output for "efficientnet-b7-pytorch" is the typical object classifier
+  output for the 1000 different classifications matching those in the ImageNet database.
+task_type: classification
+files:
+  - name: model/gen_efficientnet.py
+    size: 40997
+    sha256: 8613d48ca74611d3566d8c02cbf7c92aad6b16a708ffcf21183a7014fecdec09
+    source: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/gen_efficientnet.py
+  - name: model/efficientnet_builder.py
+    size: 18446
+    sha256: 69bb2adc49dc79c8860f36acca910bad6733e23b46ed80551248b90141d5e1b5
+    source: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/efficientnet_builder.py
+  - name: model/helpers.py
+    size: 1097
+    sha256: 0415f198b8a87cb34c9f9aed79f267043010fbd197e27df805bab9d070da82ed
+    source: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/helpers.py
+  - name: model/conv2d_helpers.py
+    size: 6175
+    sha256: e6ba7e878dd28c6d0ccc9707205bf6b58bea664d7fee820d7101a6a8e48990a9
+    source: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/conv2d_helpers.py
+  - name: model/__init__.py
+    size: 32
+    sha256: e0bedda5f5e949b8ace7d4f5cdf80e7e664c0b0a935486b6152078fa61c80c1b
+    source: https://github.com/rwightman/gen-efficientnet-pytorch/raw/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/gen_efficientnet/__init__.py
+  - name: tf-efficientnet-b7.pth
+    size: 266843942
+    sha256: 076e3472fb198ec7c3091aecc73ff205bcca4a114f5862e2297a4c2720c91826
+    source: https://github.com/rwightman/pytorch-image-models/releases/download/v0.1-weights/tf_efficientnet_b7_aa-076e3472.pth
+postprocessing:
+  - $type: regex_replace
+    file: model/conv2d_helpers.py
+    pattern: '_EXPORTABLE = False'
+    replacement: '_EXPORTABLE = True'
+conversion_to_onnx_args:
+  - --model-path=$dl_dir
+  - --model-name=tf_efficientnet_b7
+  - --import-module=model
+  - --weights=$dl_dir/tf-efficientnet-b7.pth
+  - --input-shape=1,3,600,600
+  - --input-names=data
+  - --output-names=prob
+  - --output-file=$conv_dir/efficientnet-b7.onnx
+model_optimizer_args:
+  - --reverse_input_channels
+  - --input_shape=[1,3,600,600]
+  - --input=data
+  - --mean_values=data[123.675,116.28,103.53]
+  - --scale_values=data[58.395,57.12,57.375]
+  - --output=prob
+  - --input_model=$conv_dir/efficientnet-b7.onnx
+framework: pytorch
+license: https://raw.githubusercontent.com/rwightman/gen-efficientnet-pytorch/a36e2b2cd1bd122a508a6fffeaa7606890f8c882/LICENSE
diff --git a/models/public/efficientnet-b7_auto_aug/efficientnet-b7_auto_aug.md b/models/public/efficientnet-b7_auto_aug/efficientnet-b7_auto_aug.md
new file mode 100644
index 00000000000..07fa9a04e96
--- /dev/null
+++ b/models/public/efficientnet-b7_auto_aug/efficientnet-b7_auto_aug.md
@@ -0,0 +1,76 @@
+# efficientnet-b7_auto_aug
+
+## Use Case and High-Level Description
+
+The `efficientnet-b7_auto_aug` model is one of the [EfficientNet](https://arxiv.org/abs/1905.11946)
+models designed to perform image classification, trained with the
+[AutoAugmentation preprocessing](https://arxiv.org/abs/1805.09501).
+This model was pretrained in TensorFlow\*.
+All the EfficientNet models have been pretrained on the ImageNet\* image database.
+For details about this family of models, check out the [TensorFlow Cloud TPU repository](https://github.com/tensorflow/tpu/tree/master/models/official/efficientnet).
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 77.618        |
+| MParams           | 66.193        |
+| Source framework  | TensorFlow\*  |
+
+## Accuracy
+
+| Metric | Original model | Converted model |
+| ------ | -------------- | --------------- |
+| Top 1  | 84.68          | 84.68           |
+| Top 5  | 97.09          | 97.09           | 
+
+## Performance
+
+## Input
+
+### Original Model
+
+Image, name - `image`,  shape - `[1x600x600x3]`, format is `[BxHxWxC]` where:
+
+- `B` - batch size
+- `H` - height
+- `W` - width
+- `C` - channel
+
+Channel order is `RGB`.
+
+### Converted Model
+
+Image, name - `sub/placeholder_port_0`,  shape - `[1x600x600x3]`, format is `[BxHxWxC]` where:
+
+- `B` - batch size
+- `H` - height
+- `W` - width
+- `C` - channel
+
+Channel order is `BGR`.
+
+## Output
+
+### Original Model
+
+Object classifier according to ImageNet classes, name - `logits`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+### Converted Model
+
+Object classifier according to ImageNet classes, name - `efficientnet-b7/model/head/dense/MatMul`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/tpu/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TF-TPU.txt](../licenses/APACHE-2.0-TF-TPU.txt).
diff --git a/models/public/efficientnet-b7_auto_aug/model.yml b/models/public/efficientnet-b7_auto_aug/model.yml
new file mode 100644
index 00000000000..cba950cdb9c
--- /dev/null
+++ b/models/public/efficientnet-b7_auto_aug/model.yml
@@ -0,0 +1,39 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  The "efficientnet-b7_auto_aug" model is one of the EfficientNet <https://arxiv.org/abs/1905.11946>
+  models designed to perform image classification, trained with the AutoAugmentation
+  preprocessing <https://arxiv.org/abs/1805.09501>. This model was pretrained in TensorFlow*.
+  All the EfficientNet models have been pretrained on the ImageNet* image database.
+  For details about this family of models, check out the TensorFlow Cloud TPU repository
+  <https://github.com/tensorflow/tpu/tree/master/models/official/efficientnet>.
+task_type: classification
+files:
+  - name: efficientnet-b7.tar.gz
+    size: 492077218
+    sha256: b5705cc53da6fa3e953f8509063695ed50f7adebb2488144783e20df71d0fca8
+    source: https://storage.googleapis.com/cloud-tpu-checkpoints/efficientnet/ckptsaug/efficientnet-b7.tar.gz
+postprocessing:
+  - $type: unpack_archive
+    format: gztar
+    file: efficientnet-b7.tar.gz
+model_optimizer_args:
+  - --input_shape=[1,600,600,3]
+  - --input=0:sub
+  - --output=logits
+  - --input_meta_graph=$dl_dir/efficientnet-b7/model.ckpt.meta
+  - --reverse_input_channels
+framework: tf
+license: https://raw.githubusercontent.com/tensorflow/tpu/master/LICENSE
diff --git a/models/public/face-detection-retail-0044/face-detection-retail-0044.md b/models/public/face-detection-retail-0044/face-detection-retail-0044.md
new file mode 100644
index 00000000000..6e063de08e7
--- /dev/null
+++ b/models/public/face-detection-retail-0044/face-detection-retail-0044.md
@@ -0,0 +1,88 @@
+# face-detection-retail-0044
+
+## Use Case and High-Level Description
+
+Face detector based on SqueezeNet light (half-channels) as a backbone with a
+single SSD for indoor/outdoor scenes shot by a front-facing camera. The backbone
+consists of fire modules to reduce the number of computations. The single SSD
+head from 1/16 scale feature map has nine clustered prior boxes.
+
+## Example
+
+![](./face-detection-retail-0044.png)
+
+## Specification
+
+| Metric                                                        | Value                   |
+|---------------------------------------------------------------|-------------------------|
+| AP ([WIDER](http://shuoyang1213.me/WIDERFACE/))               | 83.00%                  |
+| GFLOPs                                                        | 1.067                   |
+| MParams                                                       | 0.588                   |
+| Source framework                                              | Caffe\*                 |
+
+Average Precision (AP) is defined as an area under the
+[precision/recall](https://en.wikipedia.org/wiki/Precision_and_recall)
+curve. All numbers were evaluated by taking into account only faces bigger than
+60 x 60 pixels.
+
+## Performance
+
+## Inputs
+
+### Original Model
+
+Image, name: `input`, shape: `1,3,300,300`, format `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - number of channels
+- `H` - image height
+- `W` - image width
+
+Expected color order - BGR.
+
+### Converted Model
+
+Image, name: `input`, shape: `1,3,300,300`, format `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - number of channels
+- `H` - image height
+- `W` - image width
+
+Expected color order - BGR.
+
+## Outputs
+
+### Original Model
+
+The net outputs a blob with shape: `1,1,N,7`, where N is the number of detected
+bounding boxes. For each detection, the description has the format:
+[`image_id`, `label`, `conf`, `x_min`, `y_min`, `x_max`, `y_max`],
+where:
+
+- `image_id` - ID of the image in the batch
+- `label` - predicted class ID
+- `conf` - confidence for the predicted class
+- (`x_min`, `y_min`) - coordinates of the top left bounding box corner
+- (`x_max`, `y_max`) - coordinates of the bottom right bounding box corner.
+
+### Converted Model
+
+The net outputs a blob with shape: `1,1,N,7`, where N is the number of detected
+bounding boxes. For each detection, the description has the format:
+[`image_id`, `label`, `conf`, `x_min`, `y_min`, `x_max`, `y_max`],
+where:
+
+- `image_id` - ID of the image in the batch
+- `label` - predicted class ID
+- `conf` - confidence for the predicted class
+- (`x_min`, `y_min`) - coordinates of the top left bounding box corner
+- (`x_max`, `y_max`) - coordinates of the bottom right bounding box corner.
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/opencv/training_toolbox_caffe/develop/LICENSE).
+A copy of the license is provided in [APACHE-2.0.txt](../licenses/APACHE-2.0.txt).
+
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/public/face-detection-retail-0044/face-detection-retail-0044.png b/models/public/face-detection-retail-0044/face-detection-retail-0044.png
new file mode 100644
index 00000000000..a81877c2eda
Binary files /dev/null and b/models/public/face-detection-retail-0044/face-detection-retail-0044.png differ
diff --git a/models/public/face-detection-retail-0044/model.yml b/models/public/face-detection-retail-0044/model.yml
index 84d862c0c31..d60c99d91e7 100644
--- a/models/public/face-detection-retail-0044/model.yml
+++ b/models/public/face-detection-retail-0044/model.yml
@@ -12,7 +12,11 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-description: Face Detection (SqNet1.0modif+single scale) with BatchNormalization trained with negatives
+description: >-
+  Face detector based on SqueezeNet light (half-channels) as a backbone with a single
+  SSD for indoor/outdoor scenes shot by a front-facing camera. The backbone consists
+  of fire modules to reduce the number of computations. The single SSD head from 1/16
+  scale feature map has nine clustered prior boxes.
 task_type: detection
 files:
   - name: face-detection-retail-0044.prototxt
diff --git a/models/public/face-recognition-mobilefacenet-arcface/face-recognition-mobilefacenet-arcface.md b/models/public/face-recognition-mobilefacenet-arcface/face-recognition-mobilefacenet-arcface.md
index a1112775717..bdf2b01b088 100644
--- a/models/public/face-recognition-mobilefacenet-arcface/face-recognition-mobilefacenet-arcface.md
+++ b/models/public/face-recognition-mobilefacenet-arcface/face-recognition-mobilefacenet-arcface.md
@@ -49,22 +49,47 @@ Channel order is `BGR`.
 
 ### Original Model
 
-Face embedings, name: `pre_fc1`,  shape: `1,512`, output data format: `B,C`, where:
+Face embeddings, name: `pre_fc1`,  shape: `1,128`, output data format: `B,C`, where:
 
 - `B` - batch size
-- `C` - row-vector of 512 floating points values, face embeddings
+- `C` - row-vector of 128 floating-point values, face embeddings
 
 The net outputs on different images are comparable in cosine distance.
 
 ### Converted Model
 
-Face embeddings, name: `pre_fc1`,  shape: `1,512`, output data format: `B,C`, where:
+Face embeddings, name: `pre_fc1`,  shape: `1,128`, output data format: `B,C`, where:
 
 - `B` - batch size
-- `C` - row-vector of 512 floating points values, face embeddings
+- `C` - row-vector of 128 floating-point values, face embeddings
 
 The net outputs on different images are comparable in cosine distance.
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/deepinsight/insightface/master/LICENSE)
\ No newline at end of file
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/deepinsight/insightface/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2018 Jiankang Deng and Jia Guo
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/face-recognition-mobilefacenet-arcface/model.yml b/models/public/face-recognition-mobilefacenet-arcface/model.yml
index b471c399cb3..13f11d4e38d 100644
--- a/models/public/face-recognition-mobilefacenet-arcface/model.yml
+++ b/models/public/face-recognition-mobilefacenet-arcface/model.yml
@@ -13,7 +13,7 @@
 # limitations under the License.
 
 description: >-
-  Deep face recognition net with MobileFaceNet architecture and Arcface loss <https://arxiv.org/abs/1801.07698>
+  Deep face recognition net with MobileFaceNet backbone and Arcface loss <https://arxiv.org/abs/1801.07698>
 task_type: face_recognition
 files:
   - name: model-MobileFaceNet-arcface-ms1m-refine-v1.zip
diff --git a/models/public/face-recognition-resnet100-arcface/face-recognition-resnet100-arcface.md b/models/public/face-recognition-resnet100-arcface/face-recognition-resnet100-arcface.md
index 165e4790816..88138ce106c 100644
--- a/models/public/face-recognition-resnet100-arcface/face-recognition-resnet100-arcface.md
+++ b/models/public/face-recognition-resnet100-arcface/face-recognition-resnet100-arcface.md
@@ -67,4 +67,29 @@ The net outputs on different images are comparable in cosine distance.
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/deepinsight/insightface/master/LICENSE)
\ No newline at end of file
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/deepinsight/insightface/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2018 Jiankang Deng and Jia Guo
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/face-recognition-resnet100-arcface/model.yml b/models/public/face-recognition-resnet100-arcface/model.yml
index c3a87d0d91f..8aad33fac2e 100644
--- a/models/public/face-recognition-resnet100-arcface/model.yml
+++ b/models/public/face-recognition-resnet100-arcface/model.yml
@@ -17,7 +17,7 @@ description: >-
 task_type: face_recognition
 files:
   - name: model-r100-arcface-ms1m-refine-v2.zip
-    size: 162345348
+    size: 243494890
     sha256: eab0e5bcca81c070f56ffb11a1c32d7b2e574a8bb94f32590e7b48b355c13d1f
     source: https://www.dropbox.com/s/tj96fsm6t6rq8ye/model-r100-arcface-ms1m-refine-v2.zip?dl=1
 postprocessing:
diff --git a/models/public/face-recognition-resnet34-arcface/face-recognition-resnet34-arcface.md b/models/public/face-recognition-resnet34-arcface/face-recognition-resnet34-arcface.md
index 8960c5992c7..be17bca0dd1 100644
--- a/models/public/face-recognition-resnet34-arcface/face-recognition-resnet34-arcface.md
+++ b/models/public/face-recognition-resnet34-arcface/face-recognition-resnet34-arcface.md
@@ -67,4 +67,29 @@ The net outputs on different images are comparable in cosine distance.
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/deepinsight/insightface/master/LICENSE)
\ No newline at end of file
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/deepinsight/insightface/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2018 Jiankang Deng and Jia Guo
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/face-recognition-resnet50-arcface/face-recognition-resnet50-arcface.md b/models/public/face-recognition-resnet50-arcface/face-recognition-resnet50-arcface.md
index a581a2a0118..21e25745b49 100644
--- a/models/public/face-recognition-resnet50-arcface/face-recognition-resnet50-arcface.md
+++ b/models/public/face-recognition-resnet50-arcface/face-recognition-resnet50-arcface.md
@@ -67,4 +67,29 @@ The net outputs on different images are comparable in cosine distance.
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/deepinsight/insightface/master/LICENSE)
\ No newline at end of file
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/deepinsight/insightface/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2018 Jiankang Deng and Jia Guo
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/facenet-20180408-102900/facenet-20180408-102900.md b/models/public/facenet-20180408-102900/facenet-20180408-102900.md
index 8171a6369ee..80310187cef 100644
--- a/models/public/facenet-20180408-102900/facenet-20180408-102900.md
+++ b/models/public/facenet-20180408-102900/facenet-20180408-102900.md
@@ -61,4 +61,29 @@ Face embeddings, name - `InceptionResnetV1/Bottleneck/BatchNorm/Reshape_1/Normal
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/davidsandberg/facenet/master/LICENSE.md]()
\ No newline at end of file
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/davidsandberg/facenet/master/LICENSE.md):
+
+```
+MIT License
+
+Copyright (c) 2016 David Sandberg
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/facenet-20180408-102900/model.yml b/models/public/facenet-20180408-102900/model.yml
index 83432ce96b5..25d5aab0e64 100644
--- a/models/public/facenet-20180408-102900/model.yml
+++ b/models/public/facenet-20180408-102900/model.yml
@@ -13,8 +13,8 @@
 # limitations under the License.
 
 description: >-
-  FaceNet: A Unified Embedding for Face Recognition and Clustering. For details
-  see repository <https://github.com/davidsandberg/facenet/>, paper <https://arxiv.org/pdf/1503.03832.pdf>
+  FaceNet: A Unified Embedding for Face Recognition and Clustering. For details see
+  the repository <https://github.com/davidsandberg/facenet/>, paper <https://arxiv.org/pdf/1503.03832.pdf>
 task_type: face_recognition
 files:
   - name: 20180408-102900.zip
diff --git a/models/public/faster_rcnn_inception_resnet_v2_atrous_coco/faster_rcnn_inception_resnet_v2_atrous_coco.md b/models/public/faster_rcnn_inception_resnet_v2_atrous_coco/faster_rcnn_inception_resnet_v2_atrous_coco.md
index d2f001143ad..9cfffc5cff8 100644
--- a/models/public/faster_rcnn_inception_resnet_v2_atrous_coco/faster_rcnn_inception_resnet_v2_atrous_coco.md
+++ b/models/public/faster_rcnn_inception_resnet_v2_atrous_coco/faster_rcnn_inception_resnet_v2_atrous_coco.md
@@ -2,7 +2,7 @@
 
 ## Use Case and High-Level Description
 
-Faster R-CNN with Inception Resnet v2 Atrous version. Used for object detection. For details see the [paper](https://arxiv.org/pdf/1801.04381.pdf).
+Faster R-CNN with Inception Resnet v2 Atrous version. Used for object detection. For details see the [paper](https://arxiv.org/pdf/1506.01497v3.pdf).
 
 ## Example
 
@@ -21,7 +21,7 @@ Faster R-CNN with Inception Resnet v2 Atrous version. Used for object detection.
 
 ### Original Model
 
-Image, name: `image_tensor`, shape: [1x600x600x3], format: [BxHxWxC],
+Image, name: `image_tensor`, shape: [1x600x1024x3], format: [BxHxWxC],
    where:
 
     - B - batch size
@@ -33,7 +33,7 @@ Image, name: `image_tensor`, shape: [1x600x600x3], format: [BxHxWxC],
 
 ### Converted Model
 
-1. Image, name: `image_tensor`, shape: [1x3x600x600], format: [BxCxHxW],
+1. Image, name: `image_tensor`, shape: [1x3x600x1024], format: [BxCxHxW],
    where:
 
     - B - batch size
@@ -73,4 +73,6 @@ bounding boxes. For each detection, the description has the format:
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/faster_rcnn_inception_resnet_v2_atrous_coco/model.yml b/models/public/faster_rcnn_inception_resnet_v2_atrous_coco/model.yml
index 97ae3a7a271..9c7d2d05525 100644
--- a/models/public/faster_rcnn_inception_resnet_v2_atrous_coco/model.yml
+++ b/models/public/faster_rcnn_inception_resnet_v2_atrous_coco/model.yml
@@ -14,7 +14,7 @@
 
 description: >-
   Faster R-CNN with Inception Resnet v2 Atrous version. Used for object detection.
-  For details see paper <https://arxiv.org/pdf/1801.04381.pdf>.
+  For details see the paper <https://arxiv.org/pdf/1506.01497v3.pdf>.
 task_type: detection
 files:
   - name: faster_rcnn_inception_resnet_v2_atrous_coco_2018_01_28.tar.gz
@@ -27,9 +27,9 @@ postprocessing:
     file: faster_rcnn_inception_resnet_v2_atrous_coco_2018_01_28.tar.gz
 model_optimizer_args:
   - --reverse_input_channels
-  - --input_shape=[1,600,600,3]
+  - --input_shape=[1,600,1024,3]
   - --input=image_tensor
-  - --tensorflow_use_custom_operations_config=$mo_dir/extensions/front/tf/faster_rcnn_support.json
+  - --transformations_config=$mo_dir/extensions/front/tf/faster_rcnn_support.json
   - --tensorflow_object_detection_api_pipeline_config=$dl_dir/faster_rcnn_inception_resnet_v2_atrous_coco_2018_01_28/pipeline.config
   - --output=detection_scores,detection_boxes,num_detections
   - --input_model=$dl_dir/faster_rcnn_inception_resnet_v2_atrous_coco_2018_01_28/frozen_inference_graph.pb
diff --git a/models/public/faster_rcnn_inception_v2_coco/faster_rcnn_inception_v2_coco.md b/models/public/faster_rcnn_inception_v2_coco/faster_rcnn_inception_v2_coco.md
index 743b57b8872..4d884f9a27e 100644
--- a/models/public/faster_rcnn_inception_v2_coco/faster_rcnn_inception_v2_coco.md
+++ b/models/public/faster_rcnn_inception_v2_coco/faster_rcnn_inception_v2_coco.md
@@ -2,7 +2,7 @@
 
 ## Use Case and High-Level Description
 
-Faster R-CNN with Inception v2. Used for object detection. For details, see the [paper](https://arxiv.org/pdf/1801.04381.pdf).
+Faster R-CNN with Inception v2. Used for object detection. For details, see the [paper](https://arxiv.org/pdf/1506.01497v3.pdf).
 
 ## Example
 
@@ -21,7 +21,7 @@ Faster R-CNN with Inception v2. Used for object detection. For details, see the
 
 ### Original Model
 
-Image, name: `image_tensor`, shape: [1x600x600x3], format: [BxHxWxC],
+Image, name: `image_tensor`, shape: [1x600x1024x3], format: [BxHxWxC],
    where:
 
     - B - batch size
@@ -33,7 +33,7 @@ Image, name: `image_tensor`, shape: [1x600x600x3], format: [BxHxWxC],
 
 ### Converted Model
 
-1. Image, name: `image_tensor`, shape: [1x3x600x600], format: [BxCxHxW],
+1. Image, name: `image_tensor`, shape: [1x3x600x1024], format: [BxCxHxW],
    where:
 
     - B - batch size
@@ -73,4 +73,6 @@ bounding boxes. For each detection, the description has the format:
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/faster_rcnn_inception_v2_coco/model.yml b/models/public/faster_rcnn_inception_v2_coco/model.yml
index edf3d69478a..3b87e9e4a63 100644
--- a/models/public/faster_rcnn_inception_v2_coco/model.yml
+++ b/models/public/faster_rcnn_inception_v2_coco/model.yml
@@ -13,8 +13,8 @@
 # limitations under the License.
 
 description: >-
-  Faster R-CNN with Inception v2. Used for object detection. For details see paper
-  <https://arxiv.org/pdf/1801.04381.pdf>.
+  Faster R-CNN with Inception v2. Used for object detection. For details, see the
+  paper <https://arxiv.org/pdf/1506.01497v3.pdf>.
 task_type: detection
 files:
   - name: faster_rcnn_inception_v2_coco.tar.gz
@@ -27,10 +27,10 @@ postprocessing:
     file: faster_rcnn_inception_v2_coco.tar.gz
 model_optimizer_args:
   - --reverse_input_channels
-  - --input_shape=[1,600,600,3]
+  - --input_shape=[1,600,1024,3]
   - --input=image_tensor
   - --output=detection_scores,detection_boxes,num_detections
-  - --tensorflow_use_custom_operations_config=$mo_dir/extensions/front/tf/faster_rcnn_support.json
+  - --transformations_config=$mo_dir/extensions/front/tf/faster_rcnn_support.json
   - --tensorflow_object_detection_api_pipeline_config=$dl_dir/faster_rcnn_inception_v2_coco_2018_01_28/pipeline.config
   - --input_model=$dl_dir/faster_rcnn_inception_v2_coco_2018_01_28/frozen_inference_graph.pb
 framework: tf
diff --git a/models/public/faster_rcnn_resnet101_coco/faster_rcnn_resnet101_coco.md b/models/public/faster_rcnn_resnet101_coco/faster_rcnn_resnet101_coco.md
index f3ae717c0a8..db38fc4ef9c 100644
--- a/models/public/faster_rcnn_resnet101_coco/faster_rcnn_resnet101_coco.md
+++ b/models/public/faster_rcnn_resnet101_coco/faster_rcnn_resnet101_coco.md
@@ -2,7 +2,7 @@
 
 ## Use Case and High-Level Description
 
-Faster R-CNN Resnet-101 model. Used for object detection. For details, see the [paper](https://arxiv.org/pdf/1801.04381.pdf).
+Faster R-CNN Resnet-101 model. Used for object detection. For details, see the [paper](https://arxiv.org/pdf/1506.01497v3.pdf).
 
 ## Example
 
@@ -21,7 +21,7 @@ Faster R-CNN Resnet-101 model. Used for object detection. For details, see the [
 
 ### Original Model
 
-Image, name: `image_tensor`, shape: [1x600x600x3], format: [BxHxWxC],
+Image, name: `image_tensor`, shape: [1x600x1024x3], format: [BxHxWxC],
    where:
 
     - B - batch size
@@ -33,7 +33,7 @@ Image, name: `image_tensor`, shape: [1x600x600x3], format: [BxHxWxC],
 
 ### Converted Model
 
-1. Image, name: `image_tensor`, shape: [1x3x600x600], format: [BxCxHxW],
+1. Image, name: `image_tensor`, shape: [1x3x600x1024], format: [BxCxHxW],
    where:
 
     - B - batch size
@@ -73,4 +73,6 @@ bounding boxes. For each detection, the description has the format:
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/faster_rcnn_resnet101_coco/model.yml b/models/public/faster_rcnn_resnet101_coco/model.yml
index c547967cf20..6b4cf545ca8 100644
--- a/models/public/faster_rcnn_resnet101_coco/model.yml
+++ b/models/public/faster_rcnn_resnet101_coco/model.yml
@@ -13,8 +13,8 @@
 # limitations under the License.
 
 description: >-
-  Faster R-CNN Resnet-101 model. Used for object detection. For details see paper
-  <https://arxiv.org/pdf/1801.04381.pdf>.
+  Faster R-CNN Resnet-101 model. Used for object detection. For details, see the paper
+  <https://arxiv.org/pdf/1506.01497v3.pdf>.
 task_type: detection
 files:
   - name: faster_rcnn_resnet101_coco.tar.gz
@@ -27,10 +27,10 @@ postprocessing:
     file: faster_rcnn_resnet101_coco.tar.gz
 model_optimizer_args:
   - --reverse_input_channels
-  - --input_shape=[1,600,600,3]
+  - --input_shape=[1,600,1024,3]
   - --input=image_tensor
   - --output=detection_scores,detection_boxes,num_detections
-  - --tensorflow_use_custom_operations_config=$mo_dir/extensions/front/tf/faster_rcnn_support.json
+  - --transformations_config=$mo_dir/extensions/front/tf/faster_rcnn_support.json
   - --tensorflow_object_detection_api_pipeline_config=$dl_dir/faster_rcnn_resnet101_coco_2018_01_28/pipeline.config
   - --input_model=$dl_dir/faster_rcnn_resnet101_coco_2018_01_28/frozen_inference_graph.pb
 framework: tf
diff --git a/models/public/faster_rcnn_resnet50_coco/faster_rcnn_resnet50_coco.md b/models/public/faster_rcnn_resnet50_coco/faster_rcnn_resnet50_coco.md
index b1d2d9a886a..adee5b45b49 100644
--- a/models/public/faster_rcnn_resnet50_coco/faster_rcnn_resnet50_coco.md
+++ b/models/public/faster_rcnn_resnet50_coco/faster_rcnn_resnet50_coco.md
@@ -2,7 +2,7 @@
 
 ## Use Case and High-Level Description
 
-Faster R-CNN Resnet-50 model. Used for object detection. For details, see the [paper](https://arxiv.org/pdf/1801.04381.pdf).
+Faster R-CNN Resnet-50 model. Used for object detection. For details, see the [paper](https://arxiv.org/pdf/1506.01497v3.pdf).
 
 ## Example
 
@@ -21,7 +21,7 @@ Faster R-CNN Resnet-50 model. Used for object detection. For details, see the [p
 
 ### Original Model
 
-Image, name: `image_tensor`, shape: [1x600x600x3], format: [BxHxWxC],
+Image, name: `image_tensor`, shape: [1x600x1024x3], format: [BxHxWxC],
    where:
 
     - B - batch size
@@ -33,7 +33,7 @@ Image, name: `image_tensor`, shape: [1x600x600x3], format: [BxHxWxC],
 
 ### Converted Model
 
-1. Image, name: `image_tensor`, shape: [1x3x600x600], format: [BxCxHxW],
+1. Image, name: `image_tensor`, shape: [1x3x600x1024], format: [BxCxHxW],
    where:
 
     - B - batch size
@@ -73,4 +73,6 @@ bounding boxes. For each detection, the description has the format:
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/faster_rcnn_resnet50_coco/model.yml b/models/public/faster_rcnn_resnet50_coco/model.yml
index 4e793b62271..ca4bb3b5fa9 100644
--- a/models/public/faster_rcnn_resnet50_coco/model.yml
+++ b/models/public/faster_rcnn_resnet50_coco/model.yml
@@ -13,8 +13,8 @@
 # limitations under the License.
 
 description: >-
-  Faster R-CNN Resnet-50 model. Used for object detection. For details see paper
-  <https://arxiv.org/pdf/1801.04381.pdf>.
+  Faster R-CNN Resnet-50 model. Used for object detection. For details, see the paper
+  <https://arxiv.org/pdf/1506.01497v3.pdf>.
 task_type: detection
 files:
   - name: faster_rcnn_resnet50_coco_2018_01_28.tar.gz
@@ -27,9 +27,9 @@ postprocessing:
     file: faster_rcnn_resnet50_coco_2018_01_28.tar.gz
 model_optimizer_args:
   - --reverse_input_channels
-  - --input_shape=[1,600,600,3]
+  - --input_shape=[1,600,1024,3]
   - --input=image_tensor
-  - --tensorflow_use_custom_operations_config=$mo_dir/extensions/front/tf/faster_rcnn_support.json
+  - --transformations_config=$mo_dir/extensions/front/tf/faster_rcnn_support.json
   - --tensorflow_object_detection_api_pipeline_config=$dl_dir/faster_rcnn_resnet50_coco_2018_01_28/pipeline.config
   - --output=detection_scores,detection_boxes,num_detections
   - --input_model=$dl_dir/faster_rcnn_resnet50_coco_2018_01_28/frozen_inference_graph.pb
diff --git a/models/public/googlenet-v1-tf/freeze.py.patch b/models/public/googlenet-v1-tf/freeze.py.patch
new file mode 100644
index 00000000000..693e86bb7f4
--- /dev/null
+++ b/models/public/googlenet-v1-tf/freeze.py.patch
@@ -0,0 +1,56 @@
+diff --git a/research/slim/freeze.py b/research/slim/freeze.py
+new file mode 100644
+index 0000000..411001d
+--- /dev/null
++++ b/research/slim/freeze.py
+@@ -0,0 +1,50 @@
++import argparse
++import os
++import tensorflow as tf
++from tensorflow.python.framework import graph_io
++
++from nets import nets_factory
++
++def parse_args():
++    """Parse the four required options: --ckpt, --name, --num_classes and --output."""
++
++    parser = argparse.ArgumentParser(description='Freeze models from TF Slim')
++
++    parser.add_argument('--ckpt', type=str, required=True,
++                        help='Path to .ckpt file')
++    parser.add_argument('--name', type=str, required=True,
++                        help='Model name')
++    parser.add_argument('--num_classes', type=int, required=True,
++                        help='Number of classes')
++    parser.add_argument('--output', type=str, required=True,
++                        help='Name of output node')
++    return parser.parse_args()  # Namespace with ckpt, name, num_classes, output
++
++def convert(model_name, ckpt, num_classes, output=None):
++    tf.logging.set_verbosity(tf.logging.INFO)
++
++    with tf.Graph().as_default() as graph, tf.Session() as sess:
++        network_fn = nets_factory.get_network_fn(model_name, num_classes=num_classes, is_training=False)
++
++        size = network_fn.default_image_size
++        placeholder = tf.placeholder(name='input', dtype=tf.float32, shape=(1, size, size, 3))
++        network_fn(placeholder)
++
++        frozen = ckpt.replace('ckpt', 'frozen.pb')
++
++        tf.train.Saver().restore(sess, ckpt)
++        frozen_graph_def = tf.graph_util.convert_variables_to_constants(
++            sess, graph.as_graph_def(), [output])
++
++        print('Writing {}'.format(frozen))
++        graph_io.write_graph(frozen_graph_def, os.path.dirname(frozen), frozen, as_text=False)
++
++def main():
++    """Parse the command line, freeze the requested model, then print 'Done'."""
++    args = parse_args()
++    convert(args.name, args.ckpt, args.num_classes, args.output)
++    print('Done')
++
++
++if __name__ == '__main__':  # run the conversion only when executed as a script
++    main()
diff --git a/models/public/googlenet-v1-tf/googlenet-v1-tf.md b/models/public/googlenet-v1-tf/googlenet-v1-tf.md
new file mode 100644
index 00000000000..087fed2e175
--- /dev/null
+++ b/models/public/googlenet-v1-tf/googlenet-v1-tf.md
@@ -0,0 +1,100 @@
+# googlenet-v1-tf
+
+## Use Case and High-Level Description
+
+The `googlenet-v1-tf` model is one of the Inception family, designed to perform image classification.
+Like the other Inception models, the `googlenet-v1-tf` model has been pretrained on the ImageNet image database.
+Originally distributed as a checkpoint file, the model was converted to a frozen graph.
+For details about this family of models, check out the [paper](https://arxiv.org/pdf/1602.07261.pdf) and the [repository](https://github.com/tensorflow/models/tree/master/research/slim).
+
+### Steps to Reproduce Conversion to Frozen Graph
+
+1. Clone the original repository
+```sh
+git clone https://github.com/tensorflow/models.git
+cd models/research/slim
+```
+2. Checkout the commit that the conversion was tested on:
+```sh
+git checkout 5d36f19
+```
+3. Apply the `freeze.py.patch` patch:
+```sh
+git apply path/to/freeze.py.patch
+```
+4. Download the [pretrained weights](http://download.tensorflow.org/models/inception_v1_2016_08_28.tar.gz)
+5. Install the dependencies:
+```sh
+pip install tensorflow==1.14.0
+```
+6. Run
+```sh
+python3 freeze.py --ckpt path/to/inception_v1.ckpt --name inception_v1 --num_classes 1001 --output InceptionV1/Logits/Predictions/Softmax
+```
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 3.016         |
+| MParams           | 6.619         |
+| Source framework  | TensorFlow\*  |
+
+## Accuracy
+
+| Metric | Original model | Converted model |
+| ------ | -------------- | --------------- |
+| Top 1  | 69.81          | 69.81           |
+| Top 5  | 89.61          | 89.61           |
+
+## Performance
+
+## Input
+
+### Original model
+
+Image, name - `input`, shape - `1,224,224,3`, format is `B,H,W,C` where:
+
+- `B` - batch size
+- `H` - height
+- `W` - width
+- `C` - channel
+
+Channel order is `RGB`.
+Mean values - [127.5, 127.5, 127.5], scale value - 127.5
+
+### Converted model
+
+Image, name - `input`, shape - `1,3,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+
+## Output
+
+### Original model
+
+Object classifier according to ImageNet classes, name - `InceptionV1/Logits/Predictions/Softmax`,  shape - `1,1001`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+### Converted model
+
+Object classifier according to ImageNet classes, name - `InceptionV1/Logits/Predictions/Softmax`,  shape - `1,1001`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://github.com/tensorflow/models/blob/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/googlenet-v1-tf/model.yml b/models/public/googlenet-v1-tf/model.yml
new file mode 100644
index 00000000000..2ee1f51d6d4
--- /dev/null
+++ b/models/public/googlenet-v1-tf/model.yml
@@ -0,0 +1,35 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  The `googlenet-v1-tf` model is one of the Inception <https://arxiv.org/pdf/1602.07261.pdf>
+  family, designed to perform image classification. Like the other Inception
+  models, the `googlenet-v1-tf` model has been pretrained on the ImageNet image database.
+  For details about this family of models, check out the paper.
+task_type: classification
+files:
+  - name: inception_v1.frozen.pb
+    size: 26735789
+    sha256: 5098978b1c82717bb4d1702b200d715f6e1e37121fdf51795ff5d8a228a26485
+    source: https://download.01.org/opencv/public_models/012020/googlenet-v1-tf/inception_v1.frozen.pb
+model_optimizer_args:
+  - --input_shape=[1,224,224,3]
+  - --input=input
+  - --mean_values=input[127.5,127.5,127.5]
+  - --scale_values=input[127.5]
+  - --output=InceptionV1/Logits/Predictions/Softmax
+  - --input_model=$dl_dir/inception_v1.frozen.pb
+  - --reverse_input_channels
+framework: tf
+license: https://github.com/tensorflow/models/blob/master/LICENSE
diff --git a/models/public/googlenet-v1/googlenet-v1.md b/models/public/googlenet-v1/googlenet-v1.md
index fda7a48d494..10a5f8abb3f 100644
--- a/models/public/googlenet-v1/googlenet-v1.md
+++ b/models/public/googlenet-v1/googlenet-v1.md
@@ -68,4 +68,9 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/BVLC/caffe/master/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/BVLC/caffe/master/models/bvlc_googlenet/readme.md):
+
+```
+This model is released for unrestricted use.
+```
diff --git a/models/public/googlenet-v1/model.yml b/models/public/googlenet-v1/model.yml
index 2b23423bd85..0b62e02536e 100644
--- a/models/public/googlenet-v1/model.yml
+++ b/models/public/googlenet-v1/model.yml
@@ -13,17 +13,17 @@
 # limitations under the License.
 
 description: >-
-  The `googlenet-v1` model is the first of the Inception <https://arxiv.org/pdf/1602.07261.pdf>
+  The "googlenet-v1" model is the first of the Inception <https://arxiv.org/pdf/1602.07261.pdf>
   family of models designed to perform image classification. Like the other Inception
-  models, the `googlenet-v1` model has been pretrained on the ImageNet image database.
+  models, the "googlenet-v1" model has been pretrained on the ImageNet image database.
   For details about this family of models, check out the paper.
 
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  BGR order.  The BGR mean values need to be subtracted as follows: [104.0,117.0,123.0]
+  The model input is a blob that consists of a single image of 1x3x224x224 in BGR
+  order.  The BGR mean values need to be subtracted as follows: [104.0,117.0,123.0]
   before passing the image blob into the network.
 
-  The model output for `googlenet-v1` is the typical object classifier output
-  for the 1000 different classifications matching those in the ImageNet database.
+  The model output for "googlenet-v1" is the typical object classifier output for
+  the 1000 different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: googlenet-v1.prototxt
@@ -47,4 +47,4 @@ model_optimizer_args:
   - --input_model=$dl_dir/googlenet-v1.caffemodel
   - --input_proto=$dl_dir/googlenet-v1.prototxt
 framework: caffe
-license: https://raw.githubusercontent.com/BVLC/caffe/master/LICENSE
+license: https://raw.githubusercontent.com/BVLC/caffe/master/models/bvlc_googlenet/readme.md
diff --git a/models/public/googlenet-v2/googlenet-v2.md b/models/public/googlenet-v2/googlenet-v2.md
index ac092354a72..6280a1fb058 100644
--- a/models/public/googlenet-v2/googlenet-v2.md
+++ b/models/public/googlenet-v2/googlenet-v2.md
@@ -68,4 +68,9 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/lim0606/caffe-googlenet-bn/master/README.md]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/lim0606/caffe-googlenet-bn/master/README.md):
+
+```
+This model is released for unrestricted use.
+```
diff --git a/models/public/googlenet-v2/model.yml b/models/public/googlenet-v2/model.yml
index 5bca7c06001..3db997234d7 100644
--- a/models/public/googlenet-v2/model.yml
+++ b/models/public/googlenet-v2/model.yml
@@ -13,17 +13,17 @@
 # limitations under the License.
 
 description: >-
-  The `googlenet-v2` model is the second of the Inception <https://arxiv.org/pdf/1602.07261.pdf>
+  The "googlenet-v2" model is the second of the Inception <https://arxiv.org/pdf/1602.07261.pdf>
   family of models designed to perform image classification. Like the other Inception
-  models, the `googlenet-v2` model has been pretrained on the ImageNet image database.
+  models, the "googlenet-v2" model has been pretrained on the ImageNet image database.
   For details about this family of models, check out the paper.
 
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  BGR order. The BGR mean values need to be subtracted as follows: [104.0,117.0,123.0]
+  The model input is a blob that consists of a single image of 1x3x224x224 in BGR
+  order. The BGR mean values need to be subtracted as follows: [104.0,117.0,123.0]
   before passing the image blob into the network.
 
-  The model output for `googlenet-v2` is the typical object classifier output
-  for the 1000 different classifications matching those in the ImageNet database.
+  The model output for "googlenet-v2" is the typical object classifier output for
+  the 1000 different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: googlenet-v2.prototxt
diff --git a/models/public/googlenet-v3-pytorch/googlenet-v3-pytorch.md b/models/public/googlenet-v3-pytorch/googlenet-v3-pytorch.md
index 86695b1c86d..29aefa8a567 100644
--- a/models/public/googlenet-v3-pytorch/googlenet-v3-pytorch.md
+++ b/models/public/googlenet-v3-pytorch/googlenet-v3-pytorch.md
@@ -65,4 +65,37 @@ Object classifier according to ImageNet classes, name - `prob`, shape - [1,1000]
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/pytorch/vision/master/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/pytorch/vision/master/LICENSE):
+
+```
+BSD 3-Clause License
+
+Copyright (c) Soumith Chintala 2016,
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+
+* Redistributions of source code must retain the above copyright notice, this
+  list of conditions and the following disclaimer.
+
+* Redistributions in binary form must reproduce the above copyright notice,
+  this list of conditions and the following disclaimer in the documentation
+  and/or other materials provided with the distribution.
+
+* Neither the name of the copyright holder nor the names of its
+  contributors may be used to endorse or promote products derived from
+  this software without specific prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
+FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
+SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/googlenet-v3-pytorch/model.yml b/models/public/googlenet-v3-pytorch/model.yml
index e0c98fb22e1..596d9bc3f67 100644
--- a/models/public/googlenet-v3-pytorch/model.yml
+++ b/models/public/googlenet-v3-pytorch/model.yml
@@ -14,12 +14,12 @@
 
 description: >-
   Inception v3 is image classification model pretrained on ImageNet dataset. This
-  PyTorch implementation of architecture described in the paper "Rethinking the
-  Inception Architecture for Computer Vision" <https://arxiv.org/pdf/1512.00567.pdf>
-  in TorchVision package (see here <https://github.com/pytorch/vision>).
+  is a PyTorch implementation of the architecture described in the paper "Rethinking the Inception
+  Architecture for Computer Vision" <https://arxiv.org/pdf/1512.00567.pdf> in TorchVision
+  package (see here <https://github.com/pytorch/vision>).
 
-  The model input is a blob that consists of a single image of "1x3x299x299" in
-  RGB order.
+  The model input is a blob that consists of a single image of "1x3x299x299" in RGB
+  order.
 
   The model output is typical object classifier for the 1000 different classifications
   matching with those in the ImageNet database.
@@ -30,7 +30,7 @@ files:
     size: 108857766
     source: https://download.pytorch.org/models/inception_v3_google-1a9a5a14.pth
 framework: pytorch
-pytorch_to_onnx:
+conversion_to_onnx_args:
   - --model-name=inception_v3
   - --weights=$dl_dir/inception_v3_google-1a9a5a14.pth
   - --from-torchvision
diff --git a/models/public/googlenet-v3/googlenet-v3.md b/models/public/googlenet-v3/googlenet-v3.md
index 99a1db1c090..3dd8d912197 100644
--- a/models/public/googlenet-v3/googlenet-v3.md
+++ b/models/public/googlenet-v3/googlenet-v3.md
@@ -55,4 +55,6 @@ Object classifier according to ImageNet classes, name: `InceptionV3/Predictions/
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/googlenet-v3/model.yml b/models/public/googlenet-v3/model.yml
index 4d416c1c507..3c9b16b0336 100644
--- a/models/public/googlenet-v3/model.yml
+++ b/models/public/googlenet-v3/model.yml
@@ -13,9 +13,9 @@
 # limitations under the License.
 
 description: >-
-  The `googlenet-v3` model is the first of the Inception family of models designed
-  to perform image classification. Like the other Inception models. For details
-  about this family of models, check out the paper <https://arxiv.org/pdf/1602.07261.pdf>.
+  The "googlenet-v3" model is the first of the Inception family of models designed
+  to perform image classification. For details about this family of models, check
+  out the paper <https://arxiv.org/pdf/1602.07261.pdf>.
 task_type: classification
 files:
   - name: googlenet-v3.tar.gz
diff --git a/models/public/googlenet-v4-tf/freeze.py.patch b/models/public/googlenet-v4-tf/freeze.py.patch
new file mode 100644
index 00000000000..a4c8ab04b23
--- /dev/null
+++ b/models/public/googlenet-v4-tf/freeze.py.patch
@@ -0,0 +1,57 @@
+diff --git a/research/slim/freeze.py b/research/slim/freeze.py
+new file mode 100644
+index 0000000..411001d
+--- /dev/null
++++ b/research/slim/freeze.py
+@@ -0,0 +1,51 @@
++import argparse
++import os
++import tensorflow as tf
++from tensorflow.python.framework import graph_io
++
++from nets import nets_factory
++
++def parse_args():
++    """Parse the command-line arguments of the TF-Slim freezing script."""
++
++    parser = argparse.ArgumentParser(description='Freeze models from TF Slim')
++
++    parser.add_argument('--ckpt', type=str, required=True,
++                        help='Path to .ckpt file')  # checkpoint restored by convert()
++    parser.add_argument('--name', type=str, required=True,
++                        help='Model name')  # forwarded to nets_factory.get_network_fn
++    parser.add_argument('--num_classes', type=int, required=True,
++                        help='Number of classes')
++    parser.add_argument('--output', type=str, required=True,
++                        help='Name of output node')  # node kept as the frozen graph output
++    return parser.parse_args()  # namespace with ckpt, name, num_classes and output
++
++def convert(model_name, ckpt, num_classes, output=None):  # freeze a TF-Slim checkpoint into a binary GraphDef
++    tf.logging.set_verbosity(tf.logging.INFO)
++
++    with tf.Graph().as_default() as graph, tf.Session() as sess:
++        network_fn = nets_factory.get_network_fn(model_name, num_classes=num_classes, is_training=False)
++
++        size = network_fn.default_image_size
++        placeholder = tf.placeholder(name='input', dtype=tf.float32, shape=(1, size, size, 3))
++        network_fn(placeholder)  # builds the inference graph on the fixed-shape 'input' placeholder
++
++        frozen = ckpt.replace('ckpt', 'frozen.pb')  # e.g. inception_v4.ckpt -> inception_v4.frozen.pb
++
++        tf.train.Saver().restore(sess, ckpt)
++        frozen_graph_def = tf.graph_util.convert_variables_to_constants(
++            sess, graph.as_graph_def(), [output])  # `output` names the node to keep as graph output
++
++        print('Writing {}'.format(frozen))
++        graph_io.write_graph(frozen_graph_def, os.path.dirname(frozen), os.path.basename(frozen), as_text=False)  # write_graph joins logdir and name, so pass only the file name
++
++
++def main():  # script entry point: parse the CLI options, then freeze the requested model
++    args = parse_args()
++    convert(args.name, args.ckpt, args.num_classes, args.output)
++
++    print('Done')
++
++
++if __name__ == '__main__':  # run only when executed as a script
++    main()
diff --git a/models/public/googlenet-v4-tf/googlenet-v4-tf.md b/models/public/googlenet-v4-tf/googlenet-v4-tf.md
new file mode 100644
index 00000000000..ea4316828b9
--- /dev/null
+++ b/models/public/googlenet-v4-tf/googlenet-v4-tf.md
@@ -0,0 +1,100 @@
+# googlenet-v4-tf
+
+## Use Case and High-Level Description
+
+The `googlenet-v4-tf` model is the most recent of the Inception family of models designed to perform image classification.
+Like the other Inception models, the `googlenet-v4-tf` model has been pretrained on the ImageNet image database.
+The model was originally distributed as a checkpoint file and has been converted to a frozen graph.
+For details about this family of models, check out the [paper](https://arxiv.org/pdf/1602.07261.pdf) and the [repository](https://github.com/tensorflow/models/tree/master/research/slim).
+
+### Steps to Reproduce Conversion to Frozen Graph
+
+1. Clone the original repository
+```sh
+git clone https://github.com/tensorflow/models.git
+cd models/research/slim
+```
+2. Check out the commit that the conversion was tested on:
+```sh
+git checkout 5d36f19
+```
+3. Apply the `freeze.py.patch` patch:
+```sh
+git apply path/to/freeze.py.patch
+```
+4. Download the [pretrained weights](http://download.tensorflow.org/models/inception_v4_2016_09_09.tar.gz)
+5. Install the dependencies:
+```sh
+pip install tensorflow==1.14.0
+```
+6. Run
+```sh
+python3 freeze.py --ckpt path/to/inception_v4.ckpt --name inception_v4 --num_classes 1001 --output InceptionV4/Logits/Predictions
+```
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 24.584        |
+| MParams           | 42.648        |
+| Source framework  | TensorFlow\*  |
+
+## Accuracy
+
+| Metric | Original model | Converted model |
+| ------ | -------------- | --------------- |
+| Top 1  | 80.21          | 80.21           |
+| Top 5  | 95.20          | 95.20           |
+
+## Performance
+
+## Input
+
+### Original model
+
+Image, name - `input`, shape - `1,299,299,3`, format is `B,H,W,C` where:
+
+- `B` - batch size
+- `H` - height
+- `W` - width
+- `C` - channel
+
+Channel order is `RGB`.
+Mean values - [127.5, 127.5, 127.5], scale value - 127.5
+
+### Converted model
+
+Image, name - `input`, shape - `1,3,299,299`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`
+
+## Output
+
+### Original model
+
+Object classifier according to ImageNet classes, name - `InceptionV4/Logits/Predictions`,  shape - `1,1001`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - Predicted probabilities for each class in  [0, 1] range
+
+### Converted model
+
+Object classifier according to ImageNet classes, name - `InceptionV4/Logits/Predictions`,  shape - `1,1001`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - Predicted probabilities for each class in  [0, 1] range
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://github.com/tensorflow/models/blob/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/googlenet-v4-tf/model.yml b/models/public/googlenet-v4-tf/model.yml
new file mode 100644
index 00000000000..b6acae6c726
--- /dev/null
+++ b/models/public/googlenet-v4-tf/model.yml
@@ -0,0 +1,35 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  The `googlenet-v4-tf` model is the most recent of the Inception <https://arxiv.org/pdf/1602.07261.pdf>
+  family of models designed to perform image classification. Like the other Inception
+  models, the `googlenet-v4-tf` model has been pretrained on the ImageNet image database.
+  For details about this family of models, check out the paper.
+task_type: classification
+files:
+  - name: inception_v4.frozen.pb
+    size: 171245469
+    sha256: 51fedf837e57f18c110c6a55e4e929bb065541533208392207c3f0de9f77d53c
+    source: https://download.01.org/opencv/public_models/012020/googlenet-v4-tf/inception_v4.frozen.pb
+model_optimizer_args:
+  - --input_shape=[1,299,299,3]
+  - --input=input
+  - --mean_values=input[127.5,127.5,127.5]
+  - --scale_values=input[127.5]
+  - --output=InceptionV4/Logits/Predictions
+  - --input_model=$dl_dir/inception_v4.frozen.pb
+  - --reverse_input_channels
+framework: tf
+license: https://github.com/tensorflow/models/blob/master/LICENSE
diff --git a/models/public/googlenet-v4/googlenet-v4.md b/models/public/googlenet-v4/googlenet-v4.md
index d13a75ff7b2..8de98ba69f5 100644
--- a/models/public/googlenet-v4/googlenet-v4.md
+++ b/models/public/googlenet-v4/googlenet-v4.md
@@ -68,4 +68,29 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/soeaver/caffe-model/master/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/soeaver/caffe-model/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2017 soeaver Yang
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/googlenet-v4/model.yml b/models/public/googlenet-v4/model.yml
index c880f7914a8..77ee4cffb41 100644
--- a/models/public/googlenet-v4/model.yml
+++ b/models/public/googlenet-v4/model.yml
@@ -13,18 +13,18 @@
 # limitations under the License.
 
 description: >-
-  The `googlenet-v4` model is the most recent of the Inception <https://arxiv.org/pdf/1602.07261.pdf>
+  The "googlenet-v4" model is the most recent of the Inception <https://arxiv.org/pdf/1602.07261.pdf>
   family of models designed to perform image classification. Like the other Inception
-  models, the `googlenet-v4` model has been pretrained on the ImageNet image database.
+  models, the "googlenet-v4" model has been pretrained on the ImageNet image database.
   For details about this family of models, check out the paper.
 
-  The model input is a blob that consists of a single image of 1x3x299x299 in
-  BGR order. The BGR mean values need to be subtracted as follows: [128.0,128.0,128.0]
-  before passing the image blob into the network. In addition, values must be
-  divided by 0.0078125.
+  The model input is a blob that consists of a single image of 1x3x299x299 in BGR
+  order. The BGR mean values need to be subtracted as follows: [128.0,128.0,128.0]
+  before passing the image blob into the network. In addition, values must be divided
+  by 0.0078125.
 
-  The model output for `googlenet-v4` is the typical object classifier output
-  for the 1000 different classifications matching those in the ImageNet database.
+  The model output for "googlenet-v4" is the typical object classifier output for
+  the 1000 different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: googlenet-v4.prototxt
diff --git a/models/public/human-pose-estimation-3d-0001/description/human-pose-estimation-3d-0001.jpg b/models/public/human-pose-estimation-3d-0001/description/human-pose-estimation-3d-0001.jpg
new file mode 100644
index 00000000000..b151c7a8284
Binary files /dev/null and b/models/public/human-pose-estimation-3d-0001/description/human-pose-estimation-3d-0001.jpg differ
diff --git a/models/public/human-pose-estimation-3d-0001/description/human-pose-estimation-3d-0001.md b/models/public/human-pose-estimation-3d-0001/description/human-pose-estimation-3d-0001.md
new file mode 100644
index 00000000000..0d40b3c8313
--- /dev/null
+++ b/models/public/human-pose-estimation-3d-0001/description/human-pose-estimation-3d-0001.md
@@ -0,0 +1,44 @@
+# human-pose-estimation-3d-0001
+
+## Use Case and High-Level Description
+
+Multi-person 3D human pose estimation model based on the [Lightweight OpenPose](https://arxiv.org/pdf/1811.12004.pdf) and [Single-Shot Multi-Person 3D Pose Estimation From Monocular RGB](https://arxiv.org/pdf/1712.03453.pdf) papers.
+
+## Example
+
+![](./human-pose-estimation-3d-0001.jpg)
+
+## Specification
+
+| Metric                                                        | Value                   |
+|---------------------------------------------------------------|-------------------------|
+| MPJPE (mm)                                                    | 100.45                  |
+| GFLOPs                                                        | 18.998                  |
+| MParams                                                       | 5.074                   |
+| Source framework                                              | PyTorch\*               |
+
+## Performance
+
+## Inputs
+
+1. Name: `data`, shape: `[1x3x256x448]`. An input image in the `[BxCxHxW]` format,
+   where:
+
+    - B - batch size
+    - C - number of channels
+    - H - image height
+    - W - image width
+
+   Expected color order is BGR.
+
+## Outputs
+
+The net outputs three blobs with the following shapes: `[1, 57, 32, 56]`, `[1, 19, 32, 56]`, and `[1, 38, 32, 56]`. The first blob contains coordinates in 3D space, the second blob contains keypoint heatmaps and the third blob is keypoint pairwise relations (part affinity fields).
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/opencv/openvino_training_extensions/develop/LICENSE).
+A copy of the license is provided in [APACHE-2.0.txt](../../licenses/APACHE-2.0.txt).
+
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/public/human-pose-estimation-3d-0001/model.yml b/models/public/human-pose-estimation-3d-0001/model.yml
new file mode 100644
index 00000000000..a2fe9ca3377
--- /dev/null
+++ b/models/public/human-pose-estimation-3d-0001/model.yml
@@ -0,0 +1,46 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  Multi-person 3D human pose estimation model based on the Lightweight OpenPose <https://arxiv.org/pdf/1811.12004.pdf>
+  and Single-Shot Multi-Person 3D Pose Estimation From Monocular RGB <https://arxiv.org/pdf/1712.03453.pdf>
+  papers.
+task_type: human_pose_estimation
+files:
+  - name: human-pose-estimation-3d-0001.tar.gz
+    sha256: d2b158f07bd2f3d921bde1215829ac99afc7e63868d2d6738b24c7079db54efc
+    size: 18421831
+    source: https://download.01.org/opencv/openvino_training_extensions/models/human_pose_estimation/human-pose-estimation-3d.tar.gz
+postprocessing:
+  - $type: unpack_archive
+    format: gztar
+    file: human-pose-estimation-3d-0001.tar.gz
+framework: pytorch
+conversion_to_onnx_args:
+  - --model-path=$dl_dir
+  - --model-name=PoseEstimationWithMobileNet
+  - --model-param=is_convertible_by_mo=True
+  - --import-module=model
+  - --weights=$dl_dir/human-pose-estimation-3d-0001.pth
+  - --input-shape=1,3,256,448
+  - --input-names=data
+  - --output-names=features,heatmaps,pafs
+  - --output-file=$conv_dir/human-pose-estimation-3d-0001.onnx
+model_optimizer_args:
+  - --input=data
+  - --mean_values=data[128.0,128.0,128.0]
+  - --scale_values=data[255.0,255.0,255.0]
+  - --output=features,heatmaps,pafs
+  - --input_model=$conv_dir/human-pose-estimation-3d-0001.onnx
+license: https://raw.githubusercontent.com/opencv/openvino_training_extensions/develop/LICENSE
diff --git a/models/public/inception-resnet-v2-tf/inception-resnet-v2-tf.md b/models/public/inception-resnet-v2-tf/inception-resnet-v2-tf.md
index 6af30fc7ac8..94162aa00c9 100644
--- a/models/public/inception-resnet-v2-tf/inception-resnet-v2-tf.md
+++ b/models/public/inception-resnet-v2-tf/inception-resnet-v2-tf.md
@@ -60,4 +60,6 @@ Probabilities for all dataset classes (0 class is background). Probabilities are
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/inception-resnet-v2-tf/model.yml b/models/public/inception-resnet-v2-tf/model.yml
index 2a553850207..704da84e1a4 100644
--- a/models/public/inception-resnet-v2-tf/model.yml
+++ b/models/public/inception-resnet-v2-tf/model.yml
@@ -13,9 +13,9 @@
 # limitations under the License.
 
 description: >-
-  The `inception-resnet-v2` model is one of the Inception family of models designed
-  to perform image classification.1 Like the other Inception models. For details
-  about this family of models, check out the paper <https://arxiv.org/pdf/1602.07261.pdf>.
+  The "inception-resnet-v2" model is one of the Inception family of models designed
+  to perform image classification. For details about this family of models, check
+  out the paper <https://arxiv.org/pdf/1602.07261.pdf>.
 task_type: classification
 files:
   - name: inception_resnet_v2_2018_04_27.tgz
diff --git a/models/public/inception-resnet-v2/inception-resnet-v2.md b/models/public/inception-resnet-v2/inception-resnet-v2.md
index e6d8df4c123..6e916e5c999 100644
--- a/models/public/inception-resnet-v2/inception-resnet-v2.md
+++ b/models/public/inception-resnet-v2/inception-resnet-v2.md
@@ -68,4 +68,29 @@ Object classifier according to ImageNet classes, name - `prob`, shape - `1,1000`
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/soeaver/caffe-model/master/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/soeaver/caffe-model/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2017 soeaver Yang
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/inception-resnet-v2/model.yml b/models/public/inception-resnet-v2/model.yml
index d1105747bb4..31494a2fc7c 100644
--- a/models/public/inception-resnet-v2/model.yml
+++ b/models/public/inception-resnet-v2/model.yml
@@ -13,19 +13,18 @@
 # limitations under the License.
 
 description: >-
-  The `inception-resnet-v2` model is one of the Inception <https://arxiv.org/pdf/1602.07261.pdf>
+  The "inception-resnet-v2" model is one of the Inception <https://arxiv.org/pdf/1602.07261.pdf>
   family of models designed to perform image classification.1 Like the other Inception
-  models, the `inception-resnet-v2` model has been pretrained on the ImageNet
-  image database. For details about this family of models, check out the paper.
+  models, the "inception-resnet-v2" model has been pretrained on the ImageNet image
+  database. For details about this family of models, check out the paper.
 
-  The model input is a blob that consists of a single image of 1x3x299x299 in
-  BGR order. The BGR mean values need to be subtracted as follows: [128.0,128.0,128.0]
-  before passing the image blob into the network. In addition, values must be
-  divided by 0.0078125.
+  The model input is a blob that consists of a single image of 1x3x299x299 in BGR
+  order. The BGR mean values need to be subtracted as follows: [128.0,128.0,128.0]
+  before passing the image blob into the network. In addition, values must be divided
+  by 0.0078125.
 
-  The model output for `inception-resnet-v2` is the typical object classifier
-  output for the 1000 different classifications matching those in the ImageNet
-  database.
+  The model output for "inception-resnet-v2" is the typical object classifier output
+  for the 1000 different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: inception-resnet-v2.prototxt
diff --git a/models/public/index.md b/models/public/index.md
index 6a1d273dd28..41558407fe3 100644
--- a/models/public/index.md
+++ b/models/public/index.md
@@ -13,14 +13,19 @@ The models can be downloaded via Model Downloader
 | ----------------- | ---------------| -------------- | -------- | ------ | ------- |
 | AlexNet           | [Caffe\*](./alexnet/alexnet.md)       | alexnet   | | 1.5 | 60.965 |
 | CaffeNet          | [Caffe\*](./caffenet/caffenet.md)     | caffenet  | | 1.5 | 60.965 |
-| DenseNet 121      | [Caffe\*](./densenet-121/densenet-121.md)<br>[TensorFlow\*](./densenet-121-tf/densenet-121-tf.md)  | densenet-121<br>densenet-121-tf | | 5.289~5.724    | 7.971 |
+| DenseNet 121      | [Caffe\*](./densenet-121/densenet-121.md)<br>[TensorFlow\*](./densenet-121-tf/densenet-121-tf.md)<br>[Caffe2\*](./densenet-121-caffe2/densenet-121-caffe2.md)  | densenet-121<br>densenet-121-tf<br>densenet-121-caffe2 | | 5.289~5.724    | 7.971 |
 | DenseNet 161      | [Caffe\*](./densenet-161/densenet-161.md)<br> [TensorFlow\*](./densenet-161-tf/densenet-161-tf.md) | densenet-161<br>densenet-161-tf | | 14.128~15.561  | 28.666 |
 | DenseNet 169      | [Caffe\*](./densenet-169/densenet-169.md)<br>[TensorFlow\*](./densenet-169-tf/densenet-169-tf.md)  | densenet-169<br>densenet-169-tf | | 6.16~6.788 | 14.139 |
 | DenseNet 201      | [Caffe\*](./densenet-201/densenet-201.md) | densenet-201 | | 8.673  | 20.001  |
-| Inception (GoogleNet) V1 | [Caffe\*](./googlenet-v1/googlenet-v1.md) | googlenet-v1 | | 3.266 | 6.999 |
+| EfficientNet B0   | [TensorFlow\*](./efficientnet-b0/efficientnet-b0.md)<br>[PyTorch\*](./efficientnet-b0-pytorch/efficientnet-b0-pytorch.md) | efficientnet-b0<br>efficientnet-b0-pytorch | 75.70/92.76<br>76.91/93.21 | 0.819 | 5.268 |
+| EfficientNet B0 AutoAugment  | [TensorFlow\*](./efficientnet-b0_auto_aug/efficientnet-b0_auto_aug.md) | efficientnet-b0_auto_aug | 76.43/93.04 | 0.819 | 5.268 |
+| EfficientNet B5   | [TensorFlow\*](./efficientnet-b5/efficientnet-b5.md)<br>[PyTorch\*](./efficientnet-b5-pytorch/efficientnet-b5-pytorch.md) | efficientnet-b5<br>efficientnet-b5-pytorch | 83.33/96.67<br>83.69/96.71 | 21.252 | 30.303 | 
+| EfficientNet B7   | [PyTorch\*](./efficientnet-b7-pytorch/efficientnet-b7-pytorch.md) | efficientnet-b7-pytorch | 84.42/96.91 | 77.618  | 66.193 |
+| EfficientNet B7 AutoAugment  | [TensorFlow\*](./efficientnet-b7_auto_aug/efficientnet-b7_auto_aug.md) | efficientnet-b7_auto_aug | 84.68/97.09 | 77.618  | 66.193 |
+| Inception (GoogleNet) V1 | [Caffe\*](./googlenet-v1/googlenet-v1.md)<br>[TensorFlow\*](./googlenet-v1-tf/googlenet-v1-tf.md) | googlenet-v1<br>googlenet-v1-tf | | 3.016~3.266 | 6.619~6.999 |
 | Inception (GoogleNet) V2 | [Caffe\*](./googlenet-v2/googlenet-v2.md) | googlenet-v2 | | 4.058 | 11.185 |
 | Inception (GoogleNet) V3 | [Caffe\*](./googlenet-v3/googlenet-v3.md)<br>[PyTorch\*](./googlenet-v3-pytorch/googlenet-v3-pytorch.md) | googlenet-v3 <br> googlenet-v3-pytorch |  | 11.469 | 23.817 |
-| Inception (GoogleNet) V4 | [Caffe\*](./googlenet-v4/googlenet-v4.md) | googlenet-v4| | 24.584 | 42.648 |
+| Inception (GoogleNet) V4 | [Caffe\*](./googlenet-v4/googlenet-v4.md)<br>[TensorFlow\*](./googlenet-v4-tf/googlenet-v4-tf.md) | googlenet-v4<br>googlenet-v4-tf | | 24.584 | 42.648 |
 | Inception-ResNet V2      | [Caffe\*](./inception-resnet-v2/inception-resnet-v2.md)<br>[TensorFlow\*](./inception-resnet-v2-tf/inception-resnet-v2-tf.md) | inception-resnet-v2 <br>  inception-resnet-v2-tf | | 22.227~26.405 | 30.223~55.813 |
 | MobileNet V1 0.25 128 | [Caffe\*](./mobilenet-v1-0.25-128/mobilenet-v1-0.25-128.md) | mobilenet-v1-0.25-128 | | 0.028 | 0.468 | 
 | MobileNet V1 0.5 160 | [Caffe\*](./mobilenet-v1-0.50-160/mobilenet-v1-0.50-160.md)  | mobilenet-v1-0.50-160 | | 0.156 | 1.327 |
@@ -28,7 +33,7 @@ The models can be downloaded via Model Downloader
 | MobileNet V1 1.0 224 | [Caffe\*](./mobilenet-v1-1.0-224/mobilenet-v1-1.0-224.md)<br>[TensorFlow\*](./mobilenet-v1-1.0-224-tf/mobilenet-v1-1.0-224-tf.md) | mobilenet-v1-1.0-224 <br> mobilenet-v1-1.0-224-tf | | 1.148 | 4.221 |
 | MobileNet V2 1.0 224 | [Caffe\*](./mobilenet-v2/mobilenet-v2.md)<br>[TensorFlow\*](./mobilenet-v2-1.0-224/mobilenet-v2-1.0-224.md)<br>[PyTorch\*](./mobilenet-v2-pytorch/mobilenet-v2-pytorch.md) | mobilenet-v2 <br>  mobilenet-v2-1.0-224 <br> mobilenet-v2-pytorch | | 0.615~0.876 | 3.489 |
 | MobileNet V2 1.4 224 | [TensorFlow\*](./mobilenet-v2-1.4-224/mobilenet-v2-1.4-224.md)  | mobilenet-v2-1.4-224 | | 1.183  | 6.087 |
-| ResNet 50            | [Caffe\*](./resnet-50/resnet-50.md) <br> [PyTorch\*](./resnet-50-pytorch/resnet-50-pytorch.md) | resnet-50 <br> resnet-50-pytorch | | 6.996~8.216 | 25.53 |
+| ResNet 50            | [Caffe\*](./resnet-50/resnet-50.md) <br> [PyTorch\*](./resnet-50-pytorch/resnet-50-pytorch.md)<br>[Caffe2\*](./resnet-50-caffe2/resnet-50-caffe2.md)<br>[TensorFlow\*](./resnet-50-tf/resnet-50-tf.md) | resnet-50 <br> resnet-50-pytorch<br>resnet-50-caffe2<br>resnet-50-tf | | 6.996~8.216 | 25.53 |
 | ResNet 101           | [Caffe\*](./resnet-101/resnet-101.md) | resnet-101 | | 14.441 | 44.496 |
 | ResNet 152           | [Caffe\*](./resnet-152/resnet-152.md) | resnet-152 | | 21.89 | 60.117 |
 | SE-Inception         | [Caffe\*](./se-inception/se-inception.md)      | se-inception | | 4.091 | 11.922 |
@@ -38,9 +43,9 @@ The models can be downloaded via Model Downloader
 | SE-ResNeXt 50        | [Caffe\*](./se-resnext-50/se-resnext-50.md)    | se-resnext-50 | | 8.533 | 27.526|
 | SE-ResNeXt 101       | [Caffe\*](./se-resnext-101/se-resnext-101.md)  | se-resnext-101 | | 16.054 | 48.886 |
 | SqueezeNet v1.0      | [Caffe\*](./squeezenet1.0/squeezenet1.0.md)    | squeezenet1.0| | 1.737 | 1.248 |
-| SqueezeNet v1.1      | [Caffe\*](./squeezenet1.1/squeezenet1.1.md)    | squeezenet1.1| | 0.785 | 1.236 |
+| SqueezeNet v1.1      | [Caffe\*](./squeezenet1.1/squeezenet1.1.md)<br>[Caffe2\*](./squeezenet1.1-caffe2/squeezenet1.1-caffe2.md)    | squeezenet1.1<br>squeezenet1.1-caffe2| | 0.785 | 1.236 |
 | VGG 16               | [Caffe\*](./vgg16/vgg16.md) | vgg16 | | 30.974 | 138.358 |
-| VGG 19               | [Caffe\*](./vgg19/vgg19.md) | vgg19 | | 39.3 | 143.667  |
+| VGG 19               | [Caffe\*](./vgg19/vgg19.md)<br>[Caffe2\*](./vgg19-caffe2/vgg19-caffe2.md) | vgg19<br>vgg19-caffe2 | | 39.3 | 143.667  |
 
 **Octave Convolutions Networks**
 
@@ -100,11 +105,14 @@ SSD-based and provide reasonable accuracy/performance trade-offs.
 | Model Name                | Implementation | OMZ Model Name | GFlops | mParams |
 | ------------------------- | -------------- | -------------- | ------ | ------- |
 | CTPN                      | [TensorFlow\*](./ctpn/ctpn.md) | ctpn | 55.813 | 17.237 | |
+| CenterNet (CTDET with DLAV0) 384x384 | [ONNX\*](./ctdet_coco_dlav0_384/ctdet_coco_dlav0_384.md) | ctdet_coco_dlav0_384 | 34.994 | 17.911 |
+| CenterNet (CTDET with DLAV0) 512x512 | [ONNX\*](./ctdet_coco_dlav0_512/ctdet_coco_dlav0_512.md) | ctdet_coco_dlav0_512 | 62.211 | 17.911 |
 | Faster R-CNN with Inception-ResNet v2 | [TensorFlow\*](./faster_rcnn_inception_resnet_v2_atrous_coco/faster_rcnn_inception_resnet_v2_atrous_coco.md) | faster_rcnn_inception_resnet_v2_atrous_coco| 30.687 | 13.307 |
 | Faster R-CNN with Inception v2 | [TensorFlow\*](./faster_rcnn_inception_v2_coco/faster_rcnn_inception_v2_coco.md) | faster_rcnn_inception_v2_coco | 30.687 | 13.307 |
 | Faster R-CNN with ResNet 50    | [TensorFlow\*](./faster_rcnn_resnet50_coco/faster_rcnn_resnet50_coco.md) | faster_rcnn_resnet50_coco | 57.203 | 29.162 |
 | Faster R-CNN with ResNet 101   | [TensorFlow\*](./faster_rcnn_resnet101_coco/faster_rcnn_resnet101_coco.md) |faster_rcnn_resnet101_coco | 112.052 | 48.128 |
 | MTCNN                     | Caffe\*: <br>[proposal](./mtcnn-p/mtcnn-p.md) <br>[refine](./mtcnn-r/mtcnn-r.md) <br> [output](./mtcnn-o/mtcnn-o.md) | <br>mtcnn-p <br>mtcnn-r <br>mtcnn-o| | |
+| R-FCN with ResNet-101     | [TensorFlow\*](./rfcn-resnet101-coco-tf/rfcn-resnet101-coco-tf.md) | rfcn-resnet101-coco-tf | 53.462 | 171.85 |
 | SSD 300                   | [Caffe\*](./ssd300/ssd300.md) | ssd300 | 62.815 | 26.285 |
 | SSD 512                   | [Caffe\*](./ssd512/ssd512.md) | ssd512 | 180.611 | 27.189 |
 | SSD with MobileNet        | [Caffe\*](./mobilenet-ssd/mobilenet-ssd.md) <br>[TensorFlow\*](./ssd_mobilenet_v1_coco/ssd_mobilenet_v1_coco.md) | mobilenet-ssd <br>ssd_mobilenet_v1_coco | 2.316~2.494 | 5.783~6.807 |
@@ -123,6 +131,22 @@ SSD-based and provide reasonable accuracy/performance trade-offs.
 | MobileFaceNet,ArcFace@ms1m-refine-v1 | [MXNet\*](./face-recognition-mobilefacenet-arcface/face-recognition-mobilefacenet-arcface.md) | face-recognition-mobilefacenet-arcface | 0.449 | 0.993 |
 | SphereFace                | [Caffe\*](./Sphereface/Sphereface.md) | Sphereface | 3.504 | 22.671 |
 
+## Human Pose Estimation
+
+The human pose estimation task is to predict a pose: a body skeleton, which consists
+of keypoints and the connections between them, for every person in an input image or
+video. Keypoints are body joints, such as ears, eyes, nose, shoulders, and knees.
+There are two major groups of such methods: top-down and bottom-up. Top-down
+methods detect persons in a given frame, crop or rescale the detections, and then
+run a pose estimation network for every detection. These methods are very accurate.
+Bottom-up methods find all keypoints in a given frame and then group them by person
+instance; they are faster than top-down methods because the network runs only once.
+
+| Model Name                    | Implementation                                                                            | OMZ Model Name                | GFlops | mParams |
+|------------------------------ | ----------------------------------------------------------------------------------------- | ----------------------------- | ------ | ------- |
+| human-pose-estimation-3d-0001 | [PyTorch\*](./human-pose-estimation-3d-0001/description/human-pose-estimation-3d-0001.md) | human-pose-estimation-3d-0001 | 18.998 |  5.074  |
+|single-human-pose-estimation-0001| [PyTorch\*](./single-human-pose-estimation-0001/description/single-human-pose-estimation-0001.md) | single-human-pose-estimation-0001 | 60.125 | 33.165 |
+
 ## Legal Information
 
 [*] Other names and brands may be claimed as the property of others.
diff --git a/models/public/license-plate-recognition-barrier-0007/license-plate-recognition-barrier-0007.md b/models/public/license-plate-recognition-barrier-0007/license-plate-recognition-barrier-0007.md
new file mode 100644
index 00000000000..f3a6fce8dfb
--- /dev/null
+++ b/models/public/license-plate-recognition-barrier-0007/license-plate-recognition-barrier-0007.md
@@ -0,0 +1,219 @@
+# license-plate-recognition-barrier-0007
+
+## Use Case and High-Level Description
+
+This model uses a small-footprint network trained end-to-end to recognize
+Chinese license plates in traffic.
+
+## Validation Dataset - Internal
+
+1165 Chinese plates from different provinces
+
+## Example
+
+**Note:** The license plates in the image were modified to protect the owners' privacy.
+
+![](./license-plate-recognition-barrier-0007.png)
+
+## Specification
+
+| Metric                 | Value                   |
+|------------------------|-------------------------|
+| Rotation in-plane      | ±10°                    |
+| Rotation out-of-plane  | Yaw: ±45° / Pitch: ±45° |
+| Min plate width        | 94 pixels               |
+| Ratio of correct reads | 90.12%                  |
+| GFlops                 | 0.347                   |
+| MParams                | 1.435                   |
+| Source framework       | TensorFlow*             |
+
+## Limitations
+
+Only "blue" license plates, which are the most common type in public use, were
+tested thoroughly. The model may underperform on other types of license plates.
+
+## Performance
+Link to [performance table](https://software.intel.com/en-us/openvino-toolkit/benchmarks)
+
+## Inputs
+
+### Original Model
+
+Image, name: `data`, shape: `1,3,24,94`, format is `1,C,H,W`, where:
+
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+
+### Converted Model
+
+Image, name: `data`, shape: `1,3,24,94`, format is `1,C,H,W`, where:
+
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+
+## Outputs
+
+### Original Model
+
+Encoded vector of floats, name: `decode`, shape: `1,88,1,1`. Each float
+is an integer number encoding a character according to this dictionary:
+
+        0 0
+        1 1
+        2 2
+        3 3
+        4 4
+        5 5
+        6 6
+        7 7
+        8 8
+        9 9
+        10 <Anhui>
+        11 <Beijing>
+        12 <Chongqing>
+        13 <Fujian>
+        14 <Gansu>
+        15 <Guangdong>
+        16 <Guangxi>
+        17 <Guizhou>
+        18 <Hainan>
+        19 <Hebei>
+        20 <Heilongjiang>
+        21 <Henan>
+        22 <HongKong>
+        23 <Hubei>
+        24 <Hunan>
+        25 <InnerMongolia>
+        26 <Jiangsu>
+        27 <Jiangxi>
+        28 <Jilin>
+        29 <Liaoning>
+        30 <Macau>
+        31 <Ningxia>
+        32 <Qinghai>
+        33 <Shaanxi>
+        34 <Shandong>
+        35 <Shanghai>
+        36 <Shanxi>
+        37 <Sichuan>
+        38 <Tianjin>
+        39 <Tibet>
+        40 <Xinjiang>
+        41 <Yunnan>
+        42 <Zhejiang>
+        43 <police>
+        44 A
+        45 B
+        46 C
+        47 D
+        48 E
+        49 F
+        50 G
+        51 H
+        52 I
+        53 J
+        54 K
+        55 L
+        56 M
+        57 N
+        58 O
+        59 P
+        60 Q
+        61 R
+        62 S
+        63 T
+        64 U
+        65 V
+        66 W
+        67 X
+        68 Y
+        69 Z
+
+### Converted Model
+
+Encoded vector of floats, name: `decode`, shape: `1,88,1,1`. Each float
+is an integer number encoding a character according to this dictionary:
+
+        0 0
+        1 1
+        2 2
+        3 3
+        4 4
+        5 5
+        6 6
+        7 7
+        8 8
+        9 9
+        10 <Anhui>
+        11 <Beijing>
+        12 <Chongqing>
+        13 <Fujian>
+        14 <Gansu>
+        15 <Guangdong>
+        16 <Guangxi>
+        17 <Guizhou>
+        18 <Hainan>
+        19 <Hebei>
+        20 <Heilongjiang>
+        21 <Henan>
+        22 <HongKong>
+        23 <Hubei>
+        24 <Hunan>
+        25 <InnerMongolia>
+        26 <Jiangsu>
+        27 <Jiangxi>
+        28 <Jilin>
+        29 <Liaoning>
+        30 <Macau>
+        31 <Ningxia>
+        32 <Qinghai>
+        33 <Shaanxi>
+        34 <Shandong>
+        35 <Shanghai>
+        36 <Shanxi>
+        37 <Sichuan>
+        38 <Tianjin>
+        39 <Tibet>
+        40 <Xinjiang>
+        41 <Yunnan>
+        42 <Zhejiang>
+        43 <police>
+        44 A
+        45 B
+        46 C
+        47 D
+        48 E
+        49 F
+        50 G
+        51 H
+        52 I
+        53 J
+        54 K
+        55 L
+        56 M
+        57 N
+        58 O
+        59 P
+        60 Q
+        61 R
+        62 S
+        63 T
+        64 U
+        65 V
+        66 W
+        67 X
+        68 Y
+        69 Z
+
+## Legal Information
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/opencv/openvino_training_extensions/develop/LICENSE).
+A copy of the license is provided in [APACHE-2.0](../licenses/APACHE-2.0.txt).
+
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/public/license-plate-recognition-barrier-0007/license-plate-recognition-barrier-0007.png b/models/public/license-plate-recognition-barrier-0007/license-plate-recognition-barrier-0007.png
new file mode 100644
index 00000000000..3ea1e02c538
Binary files /dev/null and b/models/public/license-plate-recognition-barrier-0007/license-plate-recognition-barrier-0007.png differ
diff --git a/models/public/license-plate-recognition-barrier-0007/model.yml b/models/public/license-plate-recognition-barrier-0007/model.yml
index b960e517289..d99737a36bb 100644
--- a/models/public/license-plate-recognition-barrier-0007/model.yml
+++ b/models/public/license-plate-recognition-barrier-0007/model.yml
@@ -12,7 +12,9 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-description: TensorFlow LPRNet
+description: >-
+  This model uses a small-footprint network trained end-to-end to recognize Chinese
+  license plates in traffic.
 task_type: optical_character_recognition
 files:
   - name: license-plate-recognition-barrier-0007.tar.gz
diff --git a/models/public/licenses/APACHE-2.0-PyTorch-EfficientNet.txt b/models/public/licenses/APACHE-2.0-PyTorch-EfficientNet.txt
new file mode 100644
index 00000000000..4336819097f
--- /dev/null
+++ b/models/public/licenses/APACHE-2.0-PyTorch-EfficientNet.txt
@@ -0,0 +1,201 @@
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "{}"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright 2019 Ross Wightman
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
diff --git a/models/public/licenses/APACHE-2.0-SENet.txt b/models/public/licenses/APACHE-2.0-SENet.txt
new file mode 100644
index 00000000000..8dada3edaf5
--- /dev/null
+++ b/models/public/licenses/APACHE-2.0-SENet.txt
@@ -0,0 +1,201 @@
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "{}"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright {yyyy} {name of copyright owner}
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
diff --git a/models/public/licenses/APACHE-2.0-TF-DenseNet.txt b/models/public/licenses/APACHE-2.0-TF-DenseNet.txt
new file mode 100644
index 00000000000..8dada3edaf5
--- /dev/null
+++ b/models/public/licenses/APACHE-2.0-TF-DenseNet.txt
@@ -0,0 +1,201 @@
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "{}"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright {yyyy} {name of copyright owner}
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
diff --git a/models/public/licenses/APACHE-2.0-TF-TPU.txt b/models/public/licenses/APACHE-2.0-TF-TPU.txt
new file mode 100644
index 00000000000..15ae4214045
--- /dev/null
+++ b/models/public/licenses/APACHE-2.0-TF-TPU.txt
@@ -0,0 +1,203 @@
+Copyright 2017 The TensorFlow Authors.  All rights reserved.
+
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "[]"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright 2017, The TensorFlow Authors.
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
diff --git a/models/public/licenses/APACHE-2.0-TensorFlow.txt b/models/public/licenses/APACHE-2.0-TensorFlow.txt
new file mode 100644
index 00000000000..43fcf7bf1f1
--- /dev/null
+++ b/models/public/licenses/APACHE-2.0-TensorFlow.txt
@@ -0,0 +1,203 @@
+Copyright 2016 The TensorFlow Authors.  All rights reserved.
+
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "[]"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright 2016, The Authors.
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
diff --git a/models/public/licenses/APACHE-2.0.txt b/models/public/licenses/APACHE-2.0.txt
new file mode 100644
index 00000000000..d6456956733
--- /dev/null
+++ b/models/public/licenses/APACHE-2.0.txt
@@ -0,0 +1,202 @@
+
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "[]"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright [yyyy] [name of copyright owner]
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
diff --git a/models/public/licenses/CC-BY-4.0.txt b/models/public/licenses/CC-BY-4.0.txt
new file mode 100644
index 00000000000..da6ab6cc8f3
--- /dev/null
+++ b/models/public/licenses/CC-BY-4.0.txt
@@ -0,0 +1,396 @@
+Attribution 4.0 International
+
+=======================================================================
+
+Creative Commons Corporation ("Creative Commons") is not a law firm and
+does not provide legal services or legal advice. Distribution of
+Creative Commons public licenses does not create a lawyer-client or
+other relationship. Creative Commons makes its licenses and related
+information available on an "as-is" basis. Creative Commons gives no
+warranties regarding its licenses, any material licensed under their
+terms and conditions, or any related information. Creative Commons
+disclaims all liability for damages resulting from their use to the
+fullest extent possible.
+
+Using Creative Commons Public Licenses
+
+Creative Commons public licenses provide a standard set of terms and
+conditions that creators and other rights holders may use to share
+original works of authorship and other material subject to copyright
+and certain other rights specified in the public license below. The
+following considerations are for informational purposes only, are not
+exhaustive, and do not form part of our licenses.
+
+     Considerations for licensors: Our public licenses are
+     intended for use by those authorized to give the public
+     permission to use material in ways otherwise restricted by
+     copyright and certain other rights. Our licenses are
+     irrevocable. Licensors should read and understand the terms
+     and conditions of the license they choose before applying it.
+     Licensors should also secure all rights necessary before
+     applying our licenses so that the public can reuse the
+     material as expected. Licensors should clearly mark any
+     material not subject to the license. This includes other CC-
+     licensed material, or material used under an exception or
+     limitation to copyright. More considerations for licensors:
+    wiki.creativecommons.org/Considerations_for_licensors
+
+     Considerations for the public: By using one of our public
+     licenses, a licensor grants the public permission to use the
+     licensed material under specified terms and conditions. If
+     the licensor's permission is not necessary for any reason--for
+     example, because of any applicable exception or limitation to
+     copyright--then that use is not regulated by the license. Our
+     licenses grant only permissions under copyright and certain
+     other rights that a licensor has authority to grant. Use of
+     the licensed material may still be restricted for other
+     reasons, including because others have copyright or other
+     rights in the material. A licensor may make special requests,
+     such as asking that all changes be marked or described.
+     Although not required by our licenses, you are encouraged to
+     respect those requests where reasonable. More considerations
+     for the public:
+    wiki.creativecommons.org/Considerations_for_licensees
+
+=======================================================================
+
+Creative Commons Attribution 4.0 International Public License
+
+By exercising the Licensed Rights (defined below), You accept and agree
+to be bound by the terms and conditions of this Creative Commons
+Attribution 4.0 International Public License ("Public License"). To the
+extent this Public License may be interpreted as a contract, You are
+granted the Licensed Rights in consideration of Your acceptance of
+these terms and conditions, and the Licensor grants You such rights in
+consideration of benefits the Licensor receives from making the
+Licensed Material available under these terms and conditions.
+
+
+Section 1 -- Definitions.
+
+  a. Adapted Material means material subject to Copyright and Similar
+     Rights that is derived from or based upon the Licensed Material
+     and in which the Licensed Material is translated, altered,
+     arranged, transformed, or otherwise modified in a manner requiring
+     permission under the Copyright and Similar Rights held by the
+     Licensor. For purposes of this Public License, where the Licensed
+     Material is a musical work, performance, or sound recording,
+     Adapted Material is always produced where the Licensed Material is
+     synched in timed relation with a moving image.
+
+  b. Adapter's License means the license You apply to Your Copyright
+     and Similar Rights in Your contributions to Adapted Material in
+     accordance with the terms and conditions of this Public License.
+
+  c. Copyright and Similar Rights means copyright and/or similar rights
+     closely related to copyright including, without limitation,
+     performance, broadcast, sound recording, and Sui Generis Database
+     Rights, without regard to how the rights are labeled or
+     categorized. For purposes of this Public License, the rights
+     specified in Section 2(b)(1)-(2) are not Copyright and Similar
+     Rights.
+
+  d. Effective Technological Measures means those measures that, in the
+     absence of proper authority, may not be circumvented under laws
+     fulfilling obligations under Article 11 of the WIPO Copyright
+     Treaty adopted on December 20, 1996, and/or similar international
+     agreements.
+
+  e. Exceptions and Limitations means fair use, fair dealing, and/or
+     any other exception or limitation to Copyright and Similar Rights
+     that applies to Your use of the Licensed Material.
+
+  f. Licensed Material means the artistic or literary work, database,
+     or other material to which the Licensor applied this Public
+     License.
+
+  g. Licensed Rights means the rights granted to You subject to the
+     terms and conditions of this Public License, which are limited to
+     all Copyright and Similar Rights that apply to Your use of the
+     Licensed Material and that the Licensor has authority to license.
+
+  h. Licensor means the individual(s) or entity(ies) granting rights
+     under this Public License.
+
+  i. Share means to provide material to the public by any means or
+     process that requires permission under the Licensed Rights, such
+     as reproduction, public display, public performance, distribution,
+     dissemination, communication, or importation, and to make material
+     available to the public including in ways that members of the
+     public may access the material from a place and at a time
+     individually chosen by them.
+
+  j. Sui Generis Database Rights means rights other than copyright
+     resulting from Directive 96/9/EC of the European Parliament and of
+     the Council of 11 March 1996 on the legal protection of databases,
+     as amended and/or succeeded, as well as other essentially
+     equivalent rights anywhere in the world.
+
+  k. You means the individual or entity exercising the Licensed Rights
+     under this Public License. Your has a corresponding meaning.
+
+
+Section 2 -- Scope.
+
+  a. License grant.
+
+       1. Subject to the terms and conditions of this Public License,
+          the Licensor hereby grants You a worldwide, royalty-free,
+          non-sublicensable, non-exclusive, irrevocable license to
+          exercise the Licensed Rights in the Licensed Material to:
+
+            a. reproduce and Share the Licensed Material, in whole or
+               in part; and
+
+            b. produce, reproduce, and Share Adapted Material.
+
+       2. Exceptions and Limitations. For the avoidance of doubt, where
+          Exceptions and Limitations apply to Your use, this Public
+          License does not apply, and You do not need to comply with
+          its terms and conditions.
+
+       3. Term. The term of this Public License is specified in Section
+          6(a).
+
+       4. Media and formats; technical modifications allowed. The
+          Licensor authorizes You to exercise the Licensed Rights in
+          all media and formats whether now known or hereafter created,
+          and to make technical modifications necessary to do so. The
+          Licensor waives and/or agrees not to assert any right or
+          authority to forbid You from making technical modifications
+          necessary to exercise the Licensed Rights, including
+          technical modifications necessary to circumvent Effective
+          Technological Measures. For purposes of this Public License,
+          simply making modifications authorized by this Section 2(a)
+          (4) never produces Adapted Material.
+
+       5. Downstream recipients.
+
+            a. Offer from the Licensor -- Licensed Material. Every
+               recipient of the Licensed Material automatically
+               receives an offer from the Licensor to exercise the
+               Licensed Rights under the terms and conditions of this
+               Public License.
+
+            b. No downstream restrictions. You may not offer or impose
+               any additional or different terms or conditions on, or
+               apply any Effective Technological Measures to, the
+               Licensed Material if doing so restricts exercise of the
+               Licensed Rights by any recipient of the Licensed
+               Material.
+
+       6. No endorsement. Nothing in this Public License constitutes or
+          may be construed as permission to assert or imply that You
+          are, or that Your use of the Licensed Material is, connected
+          with, or sponsored, endorsed, or granted official status by,
+          the Licensor or others designated to receive attribution as
+          provided in Section 3(a)(1)(A)(i).
+
+  b. Other rights.
+
+       1. Moral rights, such as the right of integrity, are not
+          licensed under this Public License, nor are publicity,
+          privacy, and/or other similar personality rights; however, to
+          the extent possible, the Licensor waives and/or agrees not to
+          assert any such rights held by the Licensor to the limited
+          extent necessary to allow You to exercise the Licensed
+          Rights, but not otherwise.
+
+       2. Patent and trademark rights are not licensed under this
+          Public License.
+
+       3. To the extent possible, the Licensor waives any right to
+          collect royalties from You for the exercise of the Licensed
+          Rights, whether directly or through a collecting society
+          under any voluntary or waivable statutory or compulsory
+          licensing scheme. In all other cases the Licensor expressly
+          reserves any right to collect such royalties.
+
+
+Section 3 -- License Conditions.
+
+Your exercise of the Licensed Rights is expressly made subject to the
+following conditions.
+
+  a. Attribution.
+
+       1. If You Share the Licensed Material (including in modified
+          form), You must:
+
+            a. retain the following if it is supplied by the Licensor
+               with the Licensed Material:
+
+                 i. identification of the creator(s) of the Licensed
+                    Material and any others designated to receive
+                    attribution, in any reasonable manner requested by
+                    the Licensor (including by pseudonym if
+                    designated);
+
+                ii. a copyright notice;
+
+               iii. a notice that refers to this Public License;
+
+                iv. a notice that refers to the disclaimer of
+                    warranties;
+
+                 v. a URI or hyperlink to the Licensed Material to the
+                    extent reasonably practicable;
+
+            b. indicate if You modified the Licensed Material and
+               retain an indication of any previous modifications; and
+
+            c. indicate the Licensed Material is licensed under this
+               Public License, and include the text of, or the URI or
+               hyperlink to, this Public License.
+
+       2. You may satisfy the conditions in Section 3(a)(1) in any
+          reasonable manner based on the medium, means, and context in
+          which You Share the Licensed Material. For example, it may be
+          reasonable to satisfy the conditions by providing a URI or
+          hyperlink to a resource that includes the required
+          information.
+
+       3. If requested by the Licensor, You must remove any of the
+          information required by Section 3(a)(1)(A) to the extent
+          reasonably practicable.
+
+       4. If You Share Adapted Material You produce, the Adapter's
+          License You apply must not prevent recipients of the Adapted
+          Material from complying with this Public License.
+
+
+Section 4 -- Sui Generis Database Rights.
+
+Where the Licensed Rights include Sui Generis Database Rights that
+apply to Your use of the Licensed Material:
+
+  a. for the avoidance of doubt, Section 2(a)(1) grants You the right
+     to extract, reuse, reproduce, and Share all or a substantial
+     portion of the contents of the database;
+
+  b. if You include all or a substantial portion of the database
+     contents in a database in which You have Sui Generis Database
+     Rights, then the database in which You have Sui Generis Database
+     Rights (but not its individual contents) is Adapted Material; and
+
+  c. You must comply with the conditions in Section 3(a) if You Share
+     all or a substantial portion of the contents of the database.
+
+For the avoidance of doubt, this Section 4 supplements and does not
+replace Your obligations under this Public License where the Licensed
+Rights include other Copyright and Similar Rights.
+
+
+Section 5 -- Disclaimer of Warranties and Limitation of Liability.
+
+  a. UNLESS OTHERWISE SEPARATELY UNDERTAKEN BY THE LICENSOR, TO THE
+     EXTENT POSSIBLE, THE LICENSOR OFFERS THE LICENSED MATERIAL AS-IS
+     AND AS-AVAILABLE, AND MAKES NO REPRESENTATIONS OR WARRANTIES OF
+     ANY KIND CONCERNING THE LICENSED MATERIAL, WHETHER EXPRESS,
+     IMPLIED, STATUTORY, OR OTHER. THIS INCLUDES, WITHOUT LIMITATION,
+     WARRANTIES OF TITLE, MERCHANTABILITY, FITNESS FOR A PARTICULAR
+     PURPOSE, NON-INFRINGEMENT, ABSENCE OF LATENT OR OTHER DEFECTS,
+     ACCURACY, OR THE PRESENCE OR ABSENCE OF ERRORS, WHETHER OR NOT
+     KNOWN OR DISCOVERABLE. WHERE DISCLAIMERS OF WARRANTIES ARE NOT
+     ALLOWED IN FULL OR IN PART, THIS DISCLAIMER MAY NOT APPLY TO YOU.
+
+  b. TO THE EXTENT POSSIBLE, IN NO EVENT WILL THE LICENSOR BE LIABLE
+     TO YOU ON ANY LEGAL THEORY (INCLUDING, WITHOUT LIMITATION,
+     NEGLIGENCE) OR OTHERWISE FOR ANY DIRECT, SPECIAL, INDIRECT,
+     INCIDENTAL, CONSEQUENTIAL, PUNITIVE, EXEMPLARY, OR OTHER LOSSES,
+     COSTS, EXPENSES, OR DAMAGES ARISING OUT OF THIS PUBLIC LICENSE OR
+     USE OF THE LICENSED MATERIAL, EVEN IF THE LICENSOR HAS BEEN
+     ADVISED OF THE POSSIBILITY OF SUCH LOSSES, COSTS, EXPENSES, OR
+     DAMAGES. WHERE A LIMITATION OF LIABILITY IS NOT ALLOWED IN FULL OR
+     IN PART, THIS LIMITATION MAY NOT APPLY TO YOU.
+
+  c. The disclaimer of warranties and limitation of liability provided
+     above shall be interpreted in a manner that, to the extent
+     possible, most closely approximates an absolute disclaimer and
+     waiver of all liability.
+
+
+Section 6 -- Term and Termination.
+
+  a. This Public License applies for the term of the Copyright and
+     Similar Rights licensed here. However, if You fail to comply with
+     this Public License, then Your rights under this Public License
+     terminate automatically.
+
+  b. Where Your right to use the Licensed Material has terminated under
+     Section 6(a), it reinstates:
+
+       1. automatically as of the date the violation is cured, provided
+          it is cured within 30 days of Your discovery of the
+          violation; or
+
+       2. upon express reinstatement by the Licensor.
+
+     For the avoidance of doubt, this Section 6(b) does not affect any
+     right the Licensor may have to seek remedies for Your violations
+     of this Public License.
+
+  c. For the avoidance of doubt, the Licensor may also offer the
+     Licensed Material under separate terms or conditions or stop
+     distributing the Licensed Material at any time; however, doing so
+     will not terminate this Public License.
+
+  d. Sections 1, 5, 6, 7, and 8 survive termination of this Public
+     License.
+
+
+Section 7 -- Other Terms and Conditions.
+
+  a. The Licensor shall not be bound by any additional or different
+     terms or conditions communicated by You unless expressly agreed.
+
+  b. Any arrangements, understandings, or agreements regarding the
+     Licensed Material not stated herein are separate from and
+     independent of the terms and conditions of this Public License.
+
+
+Section 8 -- Interpretation.
+
+  a. For the avoidance of doubt, this Public License does not, and
+     shall not be interpreted to, reduce, limit, restrict, or impose
+     conditions on any use of the Licensed Material that could lawfully
+     be made without permission under this Public License.
+
+  b. To the extent possible, if any provision of this Public License is
+     deemed unenforceable, it shall be automatically reformed to the
+     minimum extent necessary to make it enforceable. If the provision
+     cannot be reformed, it shall be severed from this Public License
+     without affecting the enforceability of the remaining terms and
+     conditions.
+
+  c. No term or condition of this Public License will be waived and no
+     failure to comply consented to unless expressly agreed to by the
+     Licensor.
+
+  d. Nothing in this Public License constitutes or may be interpreted
+     as a limitation upon, or waiver of, any privileges and immunities
+     that apply to the Licensor or You, including from the legal
+     processes of any jurisdiction or authority.
+
+
+=======================================================================
+
+Creative Commons is not a party to its public
+licenses. Notwithstanding, Creative Commons may elect to apply one of
+its public licenses to material it publishes and in those instances
+will be considered the “Licensor.” The text of the Creative Commons
+public licenses is dedicated to the public domain under the CC0 Public
+Domain Dedication. Except for the limited purpose of indicating that
+material is shared under a Creative Commons public license or as
+otherwise permitted by the Creative Commons policies published at
+creativecommons.org/policies, Creative Commons does not authorize the
+use of the trademark "Creative Commons" or any other trademark or logo
+of Creative Commons without its prior written consent including,
+without limitation, in connection with any unauthorized modifications
+to any of its public licenses or any other arrangements,
+understandings, or agreements concerning use of licensed material. For
+the avoidance of doubt, this paragraph does not form part of the
+public licenses.
+
+Creative Commons may be contacted at creativecommons.org.
+
diff --git a/models/public/mask_rcnn_inception_resnet_v2_atrous_coco/mask_rcnn_inception_resnet_v2_atrous_coco.md b/models/public/mask_rcnn_inception_resnet_v2_atrous_coco/mask_rcnn_inception_resnet_v2_atrous_coco.md
index 2bc07a43c2b..627631ee48f 100644
--- a/models/public/mask_rcnn_inception_resnet_v2_atrous_coco/mask_rcnn_inception_resnet_v2_atrous_coco.md
+++ b/models/public/mask_rcnn_inception_resnet_v2_atrous_coco/mask_rcnn_inception_resnet_v2_atrous_coco.md
@@ -21,7 +21,7 @@ Mask R-CNN Inception Resnet V2 Atrous  is trained on COCO dataset and used for o
 
 ### Original Model
 
-Image, name: `image_tensor`, shape: [1x800x800x3], format: [BxHxWxC],
+Image, name: `image_tensor`, shape: [1x800x1365x3], format: [BxHxWxC],
    where:
 
     - B - batch size
@@ -33,7 +33,7 @@ Image, name: `image_tensor`, shape: [1x800x800x3], format: [BxHxWxC],
 
 ### Converted Model
 
-1. Image, name: `image_tensor`, shape: [1x3x800x800], format: [BxCxHxW],
+1. Image, name: `image_tensor`, shape: [1x3x800x1365], format: [BxCxHxW],
    where:
 
     - B - batch size
@@ -75,4 +75,6 @@ bounding boxes. For each detection, the description has the format:
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
\ No newline at end of file
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/mask_rcnn_inception_resnet_v2_atrous_coco/model.yml b/models/public/mask_rcnn_inception_resnet_v2_atrous_coco/model.yml
index 03fe6362d7b..2f8e629c995 100644
--- a/models/public/mask_rcnn_inception_resnet_v2_atrous_coco/model.yml
+++ b/models/public/mask_rcnn_inception_resnet_v2_atrous_coco/model.yml
@@ -13,9 +13,8 @@
 # limitations under the License.
 
 description: >-
-  Mask R-CNN Inception Resnet V2 Atrous trained on COCO dataset.
-  Used for object instance segmentation. For details see paper
-  <https://arxiv.org/pdf/1703.06870.pdf>.
+  Mask R-CNN Inception Resnet V2 Atrous is trained on the COCO dataset and used for object
+  instance segmentation. For details, see the paper <https://arxiv.org/pdf/1703.06870.pdf>.
 task_type: instance_segmentation
 files:
   - name: mask_rcnn_inception_resnet_v2_atrous_coco_2018_01_28.tar.gz
@@ -28,9 +27,9 @@ postprocessing:
     file: mask_rcnn_inception_resnet_v2_atrous_coco_2018_01_28.tar.gz
 model_optimizer_args:
   - --reverse_input_channels
-  - --input_shape=[1,800,800,3]
+  - --input_shape=[1,800,1365,3]
   - --input=image_tensor
-  - --tensorflow_use_custom_operations_config=$mo_dir/extensions/front/tf/mask_rcnn_support.json
+  - --transformations_config=$mo_dir/extensions/front/tf/mask_rcnn_support.json
   - --tensorflow_object_detection_api_pipeline_config=$dl_dir/mask_rcnn_inception_resnet_v2_atrous_coco_2018_01_28/pipeline.config
   - --input_model=$dl_dir/mask_rcnn_inception_resnet_v2_atrous_coco_2018_01_28/frozen_inference_graph.pb
 framework: tf
diff --git a/models/public/mask_rcnn_inception_v2_coco/mask_rcnn_inception_v2_coco.md b/models/public/mask_rcnn_inception_v2_coco/mask_rcnn_inception_v2_coco.md
index eb01f1da05f..823ecc4510d 100644
--- a/models/public/mask_rcnn_inception_v2_coco/mask_rcnn_inception_v2_coco.md
+++ b/models/public/mask_rcnn_inception_v2_coco/mask_rcnn_inception_v2_coco.md
@@ -22,7 +22,7 @@ For details, see a [paper](https://arxiv.org/pdf/1703.06870.pdf).
 
 ### Original Model
 
-Image, name: `image_tensor`, shape: [1x800x800x3], format: [BxHxWxC],
+Image, name: `image_tensor`, shape: [1x800x1365x3], format: [BxHxWxC],
    where:
 
     - B - batch size
@@ -34,7 +34,7 @@ Image, name: `image_tensor`, shape: [1x800x800x3], format: [BxHxWxC],
 
 ### Converted Model
 
-1. Image, name: `image_tensor`, shape: [1x3x800x800], format: [BxCxHxW],
+1. Image, name: `image_tensor`, shape: [1x3x800x1365], format: [BxCxHxW],
    where:
 
     - B - batch size
@@ -81,4 +81,6 @@ bounding boxes.
 
 ## Legal Information
 
-[License](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE)
\ No newline at end of file
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/mask_rcnn_inception_v2_coco/model.yml b/models/public/mask_rcnn_inception_v2_coco/model.yml
index bc15864b0ef..d710055926f 100644
--- a/models/public/mask_rcnn_inception_v2_coco/model.yml
+++ b/models/public/mask_rcnn_inception_v2_coco/model.yml
@@ -13,9 +13,8 @@
 # limitations under the License.
 
 description: >-
-  Mask R-CNN Inception V2 trained on COCO dataset.
-  Used for object instance segmentation. For details see paper
-  <https://arxiv.org/pdf/1703.06870.pdf>.
+  Mask R-CNN Inception V2 is trained on the COCO dataset. The model is used for object
+  instance segmentation. For details, see the paper <https://arxiv.org/pdf/1703.06870.pdf>.
 task_type: instance_segmentation
 files:
   - name: mask_rcnn_inception_v2_coco_2018_01_28.tar.gz
@@ -28,9 +27,9 @@ postprocessing:
     file: mask_rcnn_inception_v2_coco_2018_01_28.tar.gz
 model_optimizer_args:
   - --reverse_input_channels
-  - --input_shape=[1,800,800,3]
+  - --input_shape=[1,800,1365,3]
   - --input=image_tensor
-  - --tensorflow_use_custom_operations_config=$mo_dir/extensions/front/tf/mask_rcnn_support.json
+  - --transformations_config=$mo_dir/extensions/front/tf/mask_rcnn_support.json
   - --tensorflow_object_detection_api_pipeline_config=$dl_dir/mask_rcnn_inception_v2_coco_2018_01_28/pipeline.config
   - --input_model=$dl_dir/mask_rcnn_inception_v2_coco_2018_01_28/frozen_inference_graph.pb
 framework: tf
diff --git a/models/public/mask_rcnn_resnet101_atrous_coco/mask_rcnn_resnet101_atrous_coco.md b/models/public/mask_rcnn_resnet101_atrous_coco/mask_rcnn_resnet101_atrous_coco.md
index 480354afaad..69530ab222e 100644
--- a/models/public/mask_rcnn_resnet101_atrous_coco/mask_rcnn_resnet101_atrous_coco.md
+++ b/models/public/mask_rcnn_resnet101_atrous_coco/mask_rcnn_resnet101_atrous_coco.md
@@ -21,7 +21,7 @@ Mask R-CNN Resnet101 Atrous is trained on COCO dataset and used for object insta
 
 ### Original Model
 
-Image, name: `image_tensor`, shape: [1x800x800x3], format: [BxHxWxC],
+Image, name: `image_tensor`, shape: [1x800x1365x3], format: [BxHxWxC],
    where:
 
     - B - batch size
@@ -33,7 +33,7 @@ Image, name: `image_tensor`, shape: [1x800x800x3], format: [BxHxWxC],
 
 ### Converted Model
 
-1. Image, name: `image_tensor`, shape: [1x3x800x800], format: [BxCxHxW],
+1. Image, name: `image_tensor`, shape: [1x3x800x1365], format: [BxCxHxW],
    where:
 
     - B - batch size
@@ -75,4 +75,6 @@ bounding boxes. For each detection, the description has the format:
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
\ No newline at end of file
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/mask_rcnn_resnet101_atrous_coco/model.yml b/models/public/mask_rcnn_resnet101_atrous_coco/model.yml
index f16026a6305..93b39a88877 100644
--- a/models/public/mask_rcnn_resnet101_atrous_coco/model.yml
+++ b/models/public/mask_rcnn_resnet101_atrous_coco/model.yml
@@ -13,9 +13,8 @@
 # limitations under the License.
 
 description: >-
-  Mask R-CNN ResNet101 Atrous trained on COCO dataset.
-  Used for object instance segmentation. For details see paper
-  <https://arxiv.org/pdf/1703.06870.pdf>.
+  Mask R-CNN Resnet101 Atrous is trained on the COCO dataset and used for object instance
+  segmentation. For details, see the paper <https://arxiv.org/pdf/1703.06870.pdf>.
 task_type: instance_segmentation
 files:
   - name: mask_rcnn_resnet101_atrous_coco_2018_01_28.tar.gz
@@ -28,9 +27,9 @@ postprocessing:
     file: mask_rcnn_resnet101_atrous_coco_2018_01_28.tar.gz
 model_optimizer_args:
   - --reverse_input_channels
-  - --input_shape=[1,800,800,3]
+  - --input_shape=[1,800,1365,3]
   - --input=image_tensor
-  - --tensorflow_use_custom_operations_config=$mo_dir/extensions/front/tf/mask_rcnn_support.json
+  - --transformations_config=$mo_dir/extensions/front/tf/mask_rcnn_support.json
   - --tensorflow_object_detection_api_pipeline_config=$dl_dir/mask_rcnn_resnet101_atrous_coco_2018_01_28/pipeline.config
   - --input_model=$dl_dir/mask_rcnn_resnet101_atrous_coco_2018_01_28/frozen_inference_graph.pb
 framework: tf
diff --git a/models/public/mask_rcnn_resnet50_atrous_coco/mask_rcnn_resnet50_atrous_coco.md b/models/public/mask_rcnn_resnet50_atrous_coco/mask_rcnn_resnet50_atrous_coco.md
index c67d16161ba..081d945b4e4 100644
--- a/models/public/mask_rcnn_resnet50_atrous_coco/mask_rcnn_resnet50_atrous_coco.md
+++ b/models/public/mask_rcnn_resnet50_atrous_coco/mask_rcnn_resnet50_atrous_coco.md
@@ -22,7 +22,7 @@ For details, see the [paper](https://arxiv.org/pdf/1703.06870.pdf).
 
 ### Original Model
 
-Image, name: `image_tensor`, shape: [1x800x800x3], format: [BxHxWxC],
+Image, name: `image_tensor`, shape: [1x800x1365x3], format: [BxHxWxC],
    where:
 
     - B - batch size
@@ -34,7 +34,7 @@ Image, name: `image_tensor`, shape: [1x800x800x3], format: [BxHxWxC],
 
 ### Converted Model
 
-1. Image, name: `image_tensor`, shape: [1x3x800x800], format: [BxCxHxW],
+1. Image, name: `image_tensor`, shape: [1x3x800x1365], format: [BxCxHxW],
    where:
 
     - B - batch size
@@ -76,4 +76,6 @@ bounding boxes. For each detection, the description has the format:
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
\ No newline at end of file
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/mask_rcnn_resnet50_atrous_coco/model.yml b/models/public/mask_rcnn_resnet50_atrous_coco/model.yml
index b8536227dd1..a6415d67743 100644
--- a/models/public/mask_rcnn_resnet50_atrous_coco/model.yml
+++ b/models/public/mask_rcnn_resnet50_atrous_coco/model.yml
@@ -13,9 +13,8 @@
 # limitations under the License.
 
 description: >-
-  Mask R-CNN ResNet50 Atrous trained on COCO dataset.
-  Used for object instance segmentation. For details see paper
-  <https://arxiv.org/pdf/1703.06870.pdf>.
+  Mask R-CNN Resnet50 Atrous is trained on the COCO dataset. It is used for object instance
+  segmentation. For details, see the paper <https://arxiv.org/pdf/1703.06870.pdf>.
 task_type: instance_segmentation
 files:
   - name: mask_rcnn_resnet50_atrous_coco_2018_01_28.tar.gz
@@ -28,9 +27,9 @@ postprocessing:
     file: mask_rcnn_resnet50_atrous_coco_2018_01_28.tar.gz
 model_optimizer_args:
   - --reverse_input_channels
-  - --input_shape=[1,800,800,3]
+  - --input_shape=[1,800,1365,3]
   - --input=image_tensor
-  - --tensorflow_use_custom_operations_config=$mo_dir/extensions/front/tf/mask_rcnn_support.json
+  - --transformations_config=$mo_dir/extensions/front/tf/mask_rcnn_support.json
   - --tensorflow_object_detection_api_pipeline_config=$dl_dir/mask_rcnn_resnet50_atrous_coco_2018_01_28/pipeline.config
   - --input_model=$dl_dir/mask_rcnn_resnet50_atrous_coco_2018_01_28/frozen_inference_graph.pb
 framework: tf
diff --git a/models/public/mobilenet-ssd/mobilenet-ssd.md b/models/public/mobilenet-ssd/mobilenet-ssd.md
index 708cb4a2f3e..4d33f9ed691 100644
--- a/models/public/mobilenet-ssd/mobilenet-ssd.md
+++ b/models/public/mobilenet-ssd/mobilenet-ssd.md
@@ -76,4 +76,29 @@ The array of detection summary info, name - `detection_out`,  shape - `1, 1, N,
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/chuanqi305/MobileNet-SSD/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2018 chuanqi305
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/mobilenet-ssd/model.yml b/models/public/mobilenet-ssd/model.yml
index 2c83d338add..ceaa45851a2 100644
--- a/models/public/mobilenet-ssd/model.yml
+++ b/models/public/mobilenet-ssd/model.yml
@@ -13,17 +13,17 @@
 # limitations under the License.
 
 description: >-
-  The `mobilenet-ssd` model is a Single-Shot multibox Detection (SSD) network
-  intended to perform object detection. This model is implemented using the Caffe\*
-  framework. For details about this model, check out the repository <https://github.com/chuanqi305/MobileNet-SSD>.
+  The "mobilenet-ssd" model is a Single-Shot multibox Detection (SSD) network intended
+  to perform object detection. This model is implemented using the Caffe* framework.
+  For details about this model, check out the repository <https://github.com/chuanqi305/MobileNet-SSD>.
 
-  The model input is a blob that consists of a single image of 1x3x300x300 in
-  BGR order, also like the `densenet-121` model. The BGR mean values need to be
-  subtracted as follows: [127.5, 127.5, 127.5] before passing the image blob into
-  the network. In addition, values must be divided by 0.007843.
+  The model input is a blob that consists of a single image of 1x3x300x300 in BGR
+  order, as in the "densenet-121" model. The BGR mean values [127.5, 127.5, 127.5]
+  must be subtracted before passing the image blob into the network. In addition,
+  values must be multiplied by 0.007843 (that is, divided by 127.5).
 
-  The model output is a typical vector containing the tracked object data, as
-  previously described.
+  The model output is a typical vector containing the tracked object data, as previously
+  described.
 task_type: detection
 files:
   - name: mobilenet-ssd.prototxt
diff --git a/models/public/mobilenet-v1-0.25-128/mobilenet-v1-0.25-128.md b/models/public/mobilenet-v1-0.25-128/mobilenet-v1-0.25-128.md
index 24af02f94d5..25468dd2ba6 100644
--- a/models/public/mobilenet-v1-0.25-128/mobilenet-v1-0.25-128.md
+++ b/models/public/mobilenet-v1-0.25-128/mobilenet-v1-0.25-128.md
@@ -60,4 +60,6 @@ Probabilities for all dataset classes (0 class is background). Probabilities are
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/mobilenet-v1-0.25-128/model.yml b/models/public/mobilenet-v1-0.25-128/model.yml
index 26778a18486..535dfbcde8d 100644
--- a/models/public/mobilenet-v1-0.25-128/model.yml
+++ b/models/public/mobilenet-v1-0.25-128/model.yml
@@ -13,11 +13,10 @@
 # limitations under the License.
 
 description: >-
-  `mobilenet-v1-0.25-128` is one of MobileNets - small, low-latency, low-power
-  models parameterized to meet the resource constraints of a variety of use cases.
-  They can be built upon for classification, detection, embeddings and segmentation
-  similar to how other popular large scale models are used. For details see paper
-  <https://arxiv.org/abs/1704.04861>
+  "mobilenet-v1-0.25-128" is one of MobileNets - small, low-latency, low-power models
+  parameterized to meet the resource constraints of a variety of use cases. They can
+  be built upon for classification, detection, embeddings and segmentation similar
+  to how other popular large-scale models are used. For details, see the paper <https://arxiv.org/abs/1704.04861>.
 task_type: classification
 files:
   - name: mobilenet_v1_0.25_128.tgz
diff --git a/models/public/mobilenet-v1-0.50-160/mobilenet-v1-0.50-160.md b/models/public/mobilenet-v1-0.50-160/mobilenet-v1-0.50-160.md
index a78984b6258..a4f4e2efdab 100644
--- a/models/public/mobilenet-v1-0.50-160/mobilenet-v1-0.50-160.md
+++ b/models/public/mobilenet-v1-0.50-160/mobilenet-v1-0.50-160.md
@@ -60,4 +60,6 @@ Probabilities for all dataset classes (0 class is background). Probabilities are
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/mobilenet-v1-0.50-160/model.yml b/models/public/mobilenet-v1-0.50-160/model.yml
index 2da583e8bc9..4e0c1c41ef3 100644
--- a/models/public/mobilenet-v1-0.50-160/model.yml
+++ b/models/public/mobilenet-v1-0.50-160/model.yml
@@ -13,11 +13,10 @@
 # limitations under the License.
 
 description: >-
-  `mobilenet-v1-0.50-160` is one of MobileNets - small, low-latency, low-power
-  models parameterized to meet the resource constraints of a variety of use cases.
-  They can be built upon for classification, detection, embeddings and segmentation
-  similar to how other popular large scale models are used. For details see paper
-  <https://arxiv.org/abs/1704.04861>
+  "mobilenet-v1-0.50-160" is one of MobileNets - small, low-latency, low-power models
+  parameterized to meet the resource constraints of a variety of use cases. They can
+  be built upon for classification, detection, embeddings and segmentation similar
+  to how other popular large-scale models are used. For details, see the paper <https://arxiv.org/abs/1704.04861>.
 task_type: classification
 files:
   - name: mobilenet_v1_0.5_160.tgz
diff --git a/models/public/mobilenet-v1-0.50-224/mobilenet-v1-0.50-224.md b/models/public/mobilenet-v1-0.50-224/mobilenet-v1-0.50-224.md
index 02b26d3f045..382435ef2e9 100644
--- a/models/public/mobilenet-v1-0.50-224/mobilenet-v1-0.50-224.md
+++ b/models/public/mobilenet-v1-0.50-224/mobilenet-v1-0.50-224.md
@@ -60,4 +60,6 @@ Probabilities for all dataset classes (0 class is background). Probabilities are
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/mobilenet-v1-0.50-224/model.yml b/models/public/mobilenet-v1-0.50-224/model.yml
index c781b755a93..0271ecaf262 100644
--- a/models/public/mobilenet-v1-0.50-224/model.yml
+++ b/models/public/mobilenet-v1-0.50-224/model.yml
@@ -13,11 +13,10 @@
 # limitations under the License.
 
 description: >-
-  `mobilenet-v1-0.50-224` is one of MobileNets - small, low-latency, low-power
-  models parameterized to meet the resource constraints of a variety of use cases.
-  They can be built upon for classification, detection, embeddings and segmentation
-  similar to how other popular large scale models are used. For details see paper
-  <https://arxiv.org/abs/1704.04861>
+  "mobilenet-v1-0.50-224" is one of MobileNets - small, low-latency, low-power models
+  parameterized to meet the resource constraints of a variety of use cases. They can
+  be built upon for classification, detection, embeddings and segmentation similar
+  to how other popular large-scale models are used. For details, see the paper <https://arxiv.org/abs/1704.04861>.
 task_type: classification
 files:
   - name: mobilenet_v1_0.5_224.tgz
diff --git a/models/public/mobilenet-v1-1.0-224-tf/mobilenet-v1-1.0-224-tf.md b/models/public/mobilenet-v1-1.0-224-tf/mobilenet-v1-1.0-224-tf.md
index 36c592811f5..8ff45e9c452 100644
--- a/models/public/mobilenet-v1-1.0-224-tf/mobilenet-v1-1.0-224-tf.md
+++ b/models/public/mobilenet-v1-1.0-224-tf/mobilenet-v1-1.0-224-tf.md
@@ -59,4 +59,6 @@ Probabilities for all dataset classes (0 class is background). Probabilities are
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/mobilenet-v1-1.0-224-tf/model.yml b/models/public/mobilenet-v1-1.0-224-tf/model.yml
index 9772159f5f2..03c7a253d37 100644
--- a/models/public/mobilenet-v1-1.0-224-tf/model.yml
+++ b/models/public/mobilenet-v1-1.0-224-tf/model.yml
@@ -13,11 +13,10 @@
 # limitations under the License.
 
 description: >-
-  `mobilenet-v1-1.0-224` is one of MobileNets - small, low-latency, low-power
-  models parameterized to meet the resource constraints of a variety of use cases.
-  They can be built upon for classification, detection, embeddings and segmentation
-  similar to how other popular large scale models are used. For details see paper
-  <https://arxiv.org/abs/1704.04861>
+  "mobilenet-v1-1.0-224" is one of MobileNets - small, low-latency, low-power models
+  parameterized to meet the resource constraints of a variety of use cases. They can
+  be built upon for classification, detection, embeddings and segmentation similar
+  to how other popular large scale models are used. For details, see the paper <https://arxiv.org/abs/1704.04861>.
 task_type: classification
 files:
   - name: mobilenet_v1_1.0_224.tgz
diff --git a/models/public/mobilenet-v1-1.0-224/mobilenet-v1-1.0-224.md b/models/public/mobilenet-v1-1.0-224/mobilenet-v1-1.0-224.md
index 4a0f86e1d9b..ff6d01ea09a 100644
--- a/models/public/mobilenet-v1-1.0-224/mobilenet-v1-1.0-224.md
+++ b/models/public/mobilenet-v1-1.0-224/mobilenet-v1-1.0-224.md
@@ -60,4 +60,37 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/shicai/MobileNet-Caffe/26a8b8c0afb6114a07c1c9e4f550e4e0dd8cced1/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/shicai/MobileNet-Caffe/26a8b8c0afb6114a07c1c9e4f550e4e0dd8cced1/LICENSE):
+
+```
+BSD 3-Clause License
+
+Copyright (c) 2017-, Shicai Yang
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+
+* Redistributions of source code must retain the above copyright notice, this
+  list of conditions and the following disclaimer.
+
+* Redistributions in binary form must reproduce the above copyright notice,
+  this list of conditions and the following disclaimer in the documentation
+  and/or other materials provided with the distribution.
+
+* Neither the name of the copyright holder nor the names of its
+  contributors may be used to endorse or promote products derived from
+  this software without specific prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
+FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
+SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/mobilenet-v1-1.0-224/model.yml b/models/public/mobilenet-v1-1.0-224/model.yml
index 79116928ca1..b2a81645b19 100644
--- a/models/public/mobilenet-v1-1.0-224/model.yml
+++ b/models/public/mobilenet-v1-1.0-224/model.yml
@@ -13,11 +13,11 @@
 # limitations under the License.
 
 description: >-
-  `mobilenet-v1-1.0-224` is one of MobileNet V1 architecture <https://arxiv.org/abs/1704.04861>
-  with the width multiplier 1.0 and resolution 224. It is small, low-latency,
-  low-power models parameterized to meet the resource constraints of a variety
-  of use cases. They can be built upon for classification, detection, embeddings
-  and segmentation similar to how other popular large scale models are used.
+  "mobilenet-v1-1.0-224" is one of the MobileNet V1 architecture <https://arxiv.org/abs/1704.04861>
+  models, with the width multiplier 1.0 and resolution 224. MobileNets are small, low-latency,
+  low-power models parameterized to meet the resource constraints of a variety of use cases.
+  They can be built upon for classification, detection, embeddings and segmentation
+  similar to how other popular large scale models are used.
 task_type: classification
 files:
   - name: mobilenet-v1-1.0-224.prototxt
diff --git a/models/public/mobilenet-v2-1.0-224/mobilenet-v2-1.0-224.md b/models/public/mobilenet-v2-1.0-224/mobilenet-v2-1.0-224.md
index dd075de3d19..9222f34a605 100644
--- a/models/public/mobilenet-v2-1.0-224/mobilenet-v2-1.0-224.md
+++ b/models/public/mobilenet-v2-1.0-224/mobilenet-v2-1.0-224.md
@@ -61,4 +61,6 @@ Shape: [1,1001], format: [BxC],
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/mobilenet-v2-1.0-224/model.yml b/models/public/mobilenet-v2-1.0-224/model.yml
index 43c881626d2..9839da275ad 100644
--- a/models/public/mobilenet-v2-1.0-224/model.yml
+++ b/models/public/mobilenet-v2-1.0-224/model.yml
@@ -13,11 +13,10 @@
 # limitations under the License.
 
 description: >-
-  `mobilenet-v2-1.0-224` is one of MobileNets - small, low-latency, low-power
-  models parameterized to meet the resource constraints of a variety of use cases.
-  They can be built upon for classification, detection, embeddings and segmentation
-  similar to how other popular large scale models are used. For details see paper
-  <https://arxiv.org/abs/1704.04861>.
+  "mobilenet-v2-1.0-224" is one of the MobileNet* models, which are small, low-latency,
+  low-power, and parameterized to meet the resource constraints of a variety of use
+  cases. They can be used for classification, detection, embeddings, and segmentation
+  like other popular large-scale models. For details, see the paper <https://arxiv.org/abs/1704.04861>.
 task_type: classification
 files:
   - name: mobilenet_v2_1.0_224.tgz
diff --git a/models/public/mobilenet-v2-1.4-224/mobilenet-v2-1.4-224.md b/models/public/mobilenet-v2-1.4-224/mobilenet-v2-1.4-224.md
index 0786c7df7c5..5167d0facf7 100644
--- a/models/public/mobilenet-v2-1.4-224/mobilenet-v2-1.4-224.md
+++ b/models/public/mobilenet-v2-1.4-224/mobilenet-v2-1.4-224.md
@@ -58,4 +58,6 @@ Probabilities for all dataset classes (0 class is background). Probabilities are
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/mobilenet-v2-1.4-224/model.yml b/models/public/mobilenet-v2-1.4-224/model.yml
index 336e1b5b5b1..1091833133a 100644
--- a/models/public/mobilenet-v2-1.4-224/model.yml
+++ b/models/public/mobilenet-v2-1.4-224/model.yml
@@ -13,11 +13,10 @@
 # limitations under the License.
 
 description: >-
-  `mobilenet-v2-1.4-224` is one of MobileNets - small, low-latency, low-power
-  models parameterized to meet the resource constraints of a variety of use cases.
-  They can be built upon for classification, detection, embeddings and segmentation
-  similar to how other popular large scale models are used. For details see paper
-  <https://arxiv.org/abs/1704.04861>
+  "mobilenet-v2-1.4-224" is one of MobileNets - small, low-latency, low-power models
+  parameterized to meet the resource constraints of a variety of use cases. They can
+  be built upon for classification, detection, embeddings and segmentation similar
+  to how other popular large scale models are used. For details, see the paper <https://arxiv.org/abs/1704.04861>.
 task_type: classification
 files:
   - name: mobilenet-v2-1.4-224.tar.gz
diff --git a/models/public/mobilenet-v2-pytorch/mobilenet-v2-pytorch.md b/models/public/mobilenet-v2-pytorch/mobilenet-v2-pytorch.md
index 04bac3c996e..f32aea67df8 100644
--- a/models/public/mobilenet-v2-pytorch/mobilenet-v2-pytorch.md
+++ b/models/public/mobilenet-v2-pytorch/mobilenet-v2-pytorch.md
@@ -77,4 +77,6 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/tonylins/pytorch-mobilenet-v2/master/LICENSE)
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tonylins/pytorch-mobilenet-v2/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0.txt](../licenses/APACHE-2.0.txt).
diff --git a/models/public/mobilenet-v2-pytorch/model.yml b/models/public/mobilenet-v2-pytorch/model.yml
index 591943f0eca..d6c5ba7ac7a 100644
--- a/models/public/mobilenet-v2-pytorch/model.yml
+++ b/models/public/mobilenet-v2-pytorch/model.yml
@@ -36,7 +36,7 @@ files:
       $type: google_drive
       id: 1jlto6HRVD3ipNkAl1lNhDbkBp7HylaqR
 framework: pytorch
-pytorch_to_onnx:
+conversion_to_onnx_args:
   - --model-name=MobileNetV2
   - --model-path=$dl_dir
   - --weights=$dl_dir/mobilenet-v2.pth
diff --git a/models/public/mobilenet-v2/mobilenet-v2.md b/models/public/mobilenet-v2/mobilenet-v2.md
index 636135de3a9..0c3b45a3a94 100644
--- a/models/public/mobilenet-v2/mobilenet-v2.md
+++ b/models/public/mobilenet-v2/mobilenet-v2.md
@@ -62,4 +62,37 @@ Object classifier according to ImageNet classes, name: `prob`,  shape: `1,1000`,
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/shicai/MobileNet-Caffe/26a8b8c0afb6114a07c1c9e4f550e4e0dd8cced1/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/shicai/MobileNet-Caffe/26a8b8c0afb6114a07c1c9e4f550e4e0dd8cced1/LICENSE):
+
+```
+BSD 3-Clause License
+
+Copyright (c) 2017-, Shicai Yang
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+
+* Redistributions of source code must retain the above copyright notice, this
+  list of conditions and the following disclaimer.
+
+* Redistributions in binary form must reproduce the above copyright notice,
+  this list of conditions and the following disclaimer in the documentation
+  and/or other materials provided with the distribution.
+
+* Neither the name of the copyright holder nor the names of its
+  contributors may be used to endorse or promote products derived from
+  this software without specific prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
+FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
+SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/mtcnn-o/model.yml b/models/public/mtcnn-o/model.yml
index 4833a81e31b..903e2b2527f 100644
--- a/models/public/mtcnn-o/model.yml
+++ b/models/public/mtcnn-o/model.yml
@@ -13,18 +13,18 @@
 # limitations under the License.
 
 description: >-
-  The `mtcnn-o` model is the third of the mtcnn <https://arxiv.org/ftp/arxiv/papers/1604/1604.02878.pdf>
+  The "mtcnn-o" model is the third of the mtcnn <https://arxiv.org/ftp/arxiv/papers/1604/1604.02878.pdf>
   group of models designed to perform face detection. Short for "Multi-task Cascaded
-  Convolutional Neural Network", it is implemented using the Caffe\* framework.
-  The "o" designation indicates that this model is the "output" network intended
-  to take the data returned from the "refine" `mtcnn-r` network, and transform
-  it into the final output data.  For details about this family of models, check
-  out the repository <https://github.com/DuinoDu/mtcnn>.
+  Convolutional Neural Network", it is implemented using the Caffe* framework. The
+  "o" designation indicates that this model is the "output" network intended to take
+  the data returned from the "refine" "mtcnn-r" network, and transform it into the
+  final output data. For details about this family of models, check out the repository
+  <https://github.com/DuinoDu/mtcnn>.
 
-  The model input is a blob with a vector containing the refined face data, as
-  returned by the `mtcnn-r` model. The mean values need to be subtracted as follows:
-  [127.5, 127.5, 127.5] before passing the image blob into the network. In addition,
-  values must be divided by 0.0078125.
+  The model input is a blob with a vector containing the refined face data, as returned
+  by the "mtcnn-r" model. The mean values need to be subtracted as follows: [127.5,
+  127.5, 127.5] before passing the image blob into the network. In addition, values
+  must be divided by 0.0078125.
 
   The model output is a blob with a vector containing the output face data.
 task_type: detection
diff --git a/models/public/mtcnn-o/mtcnn-o.md b/models/public/mtcnn-o/mtcnn-o.md
index 06f1cd84566..504b8891d3e 100644
--- a/models/public/mtcnn-o/mtcnn-o.md
+++ b/models/public/mtcnn-o/mtcnn-o.md
@@ -64,4 +64,29 @@ Expected color order: `RGB`.
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/DuinoDu/mtcnn/master/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/DuinoDu/mtcnn/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2016 Kaipeng Zhang
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/mtcnn-p/model.yml b/models/public/mtcnn-p/model.yml
index 83456fcdd3b..4af1792306f 100644
--- a/models/public/mtcnn-p/model.yml
+++ b/models/public/mtcnn-p/model.yml
@@ -13,20 +13,20 @@
 # limitations under the License.
 
 description: >-
-  The `mtcnn-p` model is one of the mtcnn <https://arxiv.org/ftp/arxiv/papers/1604/1604.02878.pdf>
+  The "mtcnn-p" model is one of the mtcnn <https://arxiv.org/ftp/arxiv/papers/1604/1604.02878.pdf>
   group of models designed to perform face detection. Short for "Multi-task Cascaded
-  Convolutional Neural Network", it is implemented using the Caffe\* framework.
-  The "p" designation indicates that this model is the "proposal" network intended
-  to find the initial set of faces. For details about this family of models, check
-  out the repository <https://github.com/DuinoDu/mtcnn>.
+  Convolutional Neural Network", it is implemented using the Caffe* framework. The
+  "p" designation indicates that this model is the "proposal" network intended to
+  find the initial set of faces. For details about this family of models, check out
+  the repository <https://github.com/DuinoDu/mtcnn>.
 
   The model input is an image containing the data to be analyzed. The mean values
   need to be subtracted as follows: [127.5, 127.5, 127.5] before passing the image
   blob into the network. In addition, values must be divided by 0.0078125.
 
   The model output is a blob with a vector containing the first pass of face data.
-  If there are no faces detected, no further processing is needed. Otherwise,
-  you will typically use this output as input to the `mtcnn-r` model.
+  If there are no faces detected, no further processing is needed. Otherwise, you
+  will typically use this output as input to the "mtcnn-r" model.
 task_type: detection
 files:
   - name: mtcnn-p.prototxt
diff --git a/models/public/mtcnn-p/mtcnn-p.md b/models/public/mtcnn-p/mtcnn-p.md
index 2e69e45b1e1..48914fc4a2f 100644
--- a/models/public/mtcnn-p/mtcnn-p.md
+++ b/models/public/mtcnn-p/mtcnn-p.md
@@ -62,4 +62,29 @@ Expected color order: `RGB`.
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/DuinoDu/mtcnn/master/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/DuinoDu/mtcnn/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2016 Kaipeng Zhang
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/mtcnn-r/model.yml b/models/public/mtcnn-r/model.yml
index ed7d5552135..f9656fd3968 100644
--- a/models/public/mtcnn-r/model.yml
+++ b/models/public/mtcnn-r/model.yml
@@ -13,21 +13,21 @@
 # limitations under the License.
 
 description: >-
-  The `mtcnn-r` model is one of the mtcnn <https://arxiv.org/ftp/arxiv/papers/1604/1604.02878.pdf>
+  The "mtcnn-r" model is one of the mtcnn <https://arxiv.org/ftp/arxiv/papers/1604/1604.02878.pdf>
   group of models designed to perform face detection. Short for "Multi-task Cascaded
-  Convolutional Neural Network", it is implemented using the Caffe\* framework.
-  The "r" designation indicates that this model is the "refine" network intended
-  to refine the data returned as output from the "proposal" `mtcnn-p` network.
-  For details about this family of models, check out the repository <https://github.com/DuinoDu/mtcnn>.
+  Convolutional Neural Network", it is implemented using the Caffe* framework. The
+  "r" designation indicates that this model is the "refine" network intended to refine
+  the data returned as output from the "proposal" "mtcnn-p" network. For details about
+  this family of models, check out the repository <https://github.com/DuinoDu/mtcnn>.
 
   The model input is a blob with a vector containing the first pass of face data,
-  as returned by the `mtcnn-p` model. The mean values need to be subtracted as
-  follows: [127.5, 127.5, 127.5] before passing the image blob into the network.
-  In addition, values must be divided by 0.0078125.
+  as returned by the "mtcnn-p" model. The mean values need to be subtracted as follows:
+  [127.5, 127.5, 127.5] before passing the image blob into the network. In addition,
+  values must be divided by 0.0078125.
 
-  The model output is a blob with a vector containing the refined face data. If
-  there are no faces detected by the refine pass, no further processing is needed.
-  Otherwise, you will typically use this output as input to the `mtcnn-o` model.
+  The model output is a blob with a vector containing the refined face data. If there
+  are no faces detected by the refine pass, no further processing is needed. Otherwise,
+  you will typically use this output as input to the "mtcnn-o" model.
 task_type: detection
 files:
   - name: mtcnn-r.prototxt
diff --git a/models/public/mtcnn-r/mtcnn-r.md b/models/public/mtcnn-r/mtcnn-r.md
index e215855d4df..fc3eb9f0a9f 100644
--- a/models/public/mtcnn-r/mtcnn-r.md
+++ b/models/public/mtcnn-r/mtcnn-r.md
@@ -62,4 +62,29 @@ Expected color order: `RGB`
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/DuinoDu/mtcnn/master/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/DuinoDu/mtcnn/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) 2016 Kaipeng Zhang
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/octave-densenet-121-0.125/model.yml b/models/public/octave-densenet-121-0.125/model.yml
index 664edd19bdc..b1b4db8a12d 100644
--- a/models/public/octave-densenet-121-0.125/model.yml
+++ b/models/public/octave-densenet-121-0.125/model.yml
@@ -13,21 +13,12 @@
 # limitations under the License.
 
 description: >-
-  The `octave-densenet-121-0.125` model is a modification of `densenet-121` from
-  this paper <https://arxiv.org/pdf/1608.06993> with octave convolutions from
-  Drop an Octave: Reducing Spatial Redundancy in Convolutional Neural Networks
-  with Octave Convolution <https://arxiv.org/abs/1904.05049> with `alpha=0.125`.
-  As origin, it's designed to perform image classification. For details about
-  family of octave convolution models, check out the repository <https://github.com/facebookresearch/OctConv>.
-
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  RGB order. The RGB mean values need to be subtracted as follows: [124,117,104]
-  before passing the image blob into the network. In addition, values must be
-  divided by 0.0167.
-
-  The model output for `octave-densenet-121-0.125` is the typical object classifier
-  output for the 1000 different classifications matching those in the ImageNet
-  database.
+  The "octave-densenet-121-0.125" model is a modification of "densenet-121" <https://arxiv.org/pdf/1608.06993>
+  with Octave convolutions from Drop an Octave: Reducing Spatial Redundancy in Convolutional
+  Neural Networks with Octave Convolution <https://arxiv.org/abs/1904.05049> with
+  "alpha=0.125". Like the original model, this model is designed for image classification.
+  For details about the family of Octave Convolution models, check out the repository
+  <https://github.com/facebookresearch/OctConv>.
 task_type: classification
 files:
   - name: a01_densenet-121_alpha-0.125.tar
@@ -46,6 +37,5 @@ model_optimizer_args:
   - --input=data
   - --output=softmax
   - --input_model=$dl_dir/a01_densenet-121_alpha-0.125/checkpoint-0-0000.params
-  - --input_symbol=$dl_dir/a01_densenet-121_alpha-0.125/checkpoint-0-symbol.json
 framework: mxnet
 license: https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE
diff --git a/models/public/octave-densenet-121-0.125/octave-densenet-121-0.125.md b/models/public/octave-densenet-121-0.125/octave-densenet-121-0.125.md
index 05e30d3ffad..03bf3cace29 100644
--- a/models/public/octave-densenet-121-0.125/octave-densenet-121-0.125.md
+++ b/models/public/octave-densenet-121-0.125/octave-densenet-121-0.125.md
@@ -67,4 +67,29 @@ Object classifier according to ImageNet classes, name: `prob`,  shape: `1,1000`,
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) Facebook, Inc. and its affiliates.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/octave-resnet-101-0.125/model.yml b/models/public/octave-resnet-101-0.125/model.yml
index 84208876a49..914470610cf 100644
--- a/models/public/octave-resnet-101-0.125/model.yml
+++ b/models/public/octave-resnet-101-0.125/model.yml
@@ -13,21 +13,12 @@
 # limitations under the License.
 
 description: >-
-  The `octave-resnet-101-0.125` model is a modification of `resnet-101` from this
-  paper <https://arxiv.org/pdf/1512.03385.pdf> with octave convolutions from Drop
-  an Octave: Reducing Spatial Redundancy in Convolutional Neural Networks with
-  Octave Convolution <https://arxiv.org/abs/1904.05049> with `alpha=0.125`. As
-  origin, it's designed to perform image classification. For details about family
-  of octave convolution models, check out the repository <https://github.com/facebookresearch/OctConv>.
-
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  RGB order. The RGB mean values need to be subtracted as follows: [124,117,104]
-  before passing the image blob into the network. In addition, values must be
-  divided by 0.0167.
-
-  The model output for `octave-resnet-101-0.125` is the typical object classifier
-  output for the 1000 different classifications matching those in the ImageNet
-  database.
+  The "octave-resnet-101-0.125" model is a modification of "resnet-101" <https://arxiv.org/pdf/1512.03385.pdf>
+  with Octave convolutions from Drop an Octave: Reducing Spatial Redundancy in Convolutional
+  Neural Networks with Octave Convolution <https://arxiv.org/abs/1904.05049> with
+  "alpha=0.125". Like the original model, this model is designed for image classification.
+  For details about the family of Octave Convolution models, check out the repository
+  <https://github.com/facebookresearch/OctConv>.
 task_type: classification
 files:
   - name: a06_resnet-101_alpha-0.125.tar
@@ -46,6 +37,5 @@ model_optimizer_args:
   - --input=data
   - --output=softmax
   - --input_model=$dl_dir/a06_resnet-101_alpha-0.125/checkpoint-0-0000.params
-  - --input_symbol=$dl_dir/a06_resnet-101_alpha-0.125/checkpoint-0-symbol.json
 framework: mxnet
 license: https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE
diff --git a/models/public/octave-resnet-101-0.125/octave-resnet-101-0.125.md b/models/public/octave-resnet-101-0.125/octave-resnet-101-0.125.md
index 766c83b8168..8e1da527524 100644
--- a/models/public/octave-resnet-101-0.125/octave-resnet-101-0.125.md
+++ b/models/public/octave-resnet-101-0.125/octave-resnet-101-0.125.md
@@ -67,4 +67,29 @@ Object classifier according to ImageNet classes, name: `prob`,  shape: `1,1000`,
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) Facebook, Inc. and its affiliates.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/octave-resnet-200-0.125/model.yml b/models/public/octave-resnet-200-0.125/model.yml
index a81ad0cdc53..3b275849d9e 100644
--- a/models/public/octave-resnet-200-0.125/model.yml
+++ b/models/public/octave-resnet-200-0.125/model.yml
@@ -13,21 +13,12 @@
 # limitations under the License.
 
 description: >-
-  The `octave-resnet-200-0.125` model is a modification of `resnet-200` from this
-  paper <https://arxiv.org/pdf/1512.03385.pdf> with octave convolutions from Drop
-  an Octave: Reducing Spatial Redundancy in Convolutional Neural Networks with
-  Octave Convolution <https://arxiv.org/abs/1904.05049> with `alpha=0.125`. As
-  origin, it's designed to perform image classification. For details about family
-  of octave convolution models, check out the repository <https://github.com/facebookresearch/OctConv>.
-
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  RGB order. The RGB mean values need to be subtracted as follows: [124,117,104]
-  before passing the image blob into the network. In addition, values must be
-  divided by 0.0167.
-
-  The model output for `octave-resnet-200-0.125` is the typical object classifier
-  output for the 1000 different classifications matching those in the ImageNet
-  database.
+  The "octave-resnet-200-0.125" model is a modification of "resnet-200" <https://arxiv.org/pdf/1512.03385.pdf>
+  with Octave convolutions from Drop an Octave: Reducing Spatial Redundancy in Convolutional
+  Neural Networks with Octave Convolution <https://arxiv.org/abs/1904.05049> with
+  "alpha=0.125". Like the original model, this model is designed for image classification.
+  For details about the family of Octave Convolution models, check out the repository
+  <https://github.com/facebookresearch/OctConv>.
 task_type: classification
 files:
   - name: a08_resnet-200_alpha-0.125.tar
@@ -46,6 +37,5 @@ model_optimizer_args:
   - --input=data
   - --output=softmax
   - --input_model=$dl_dir/a08_resnet-200_alpha-0.125/checkpoint-0-0000.params
-  - --input_symbol=$dl_dir/a08_resnet-200_alpha-0.125/checkpoint-0-symbol.json
 framework: mxnet
 license: https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE
diff --git a/models/public/octave-resnet-200-0.125/octave-resnet-200-0.125.md b/models/public/octave-resnet-200-0.125/octave-resnet-200-0.125.md
index 6b11a4c6068..7c028870209 100644
--- a/models/public/octave-resnet-200-0.125/octave-resnet-200-0.125.md
+++ b/models/public/octave-resnet-200-0.125/octave-resnet-200-0.125.md
@@ -66,4 +66,29 @@ Object classifier according to ImageNet classes, name: `prob`,  shape: `1,1000`,
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) Facebook, Inc. and its affiliates.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/octave-resnet-26-0.25/model.yml b/models/public/octave-resnet-26-0.25/model.yml
index 4af491dae96..b870e4815ae 100644
--- a/models/public/octave-resnet-26-0.25/model.yml
+++ b/models/public/octave-resnet-26-0.25/model.yml
@@ -13,21 +13,12 @@
 # limitations under the License.
 
 description: >-
-  The `octave-resnet-26-0.25` model is a modification of `resnet-26` from this
-  paper <https://arxiv.org/pdf/1512.03385.pdf> with octave convolutions from Drop
-  an Octave: Reducing Spatial Redundancy in Convolutional Neural Networks with
-  Octave Convolution <https://arxiv.org/abs/1904.05049> with `alpha=0.25`. As
-  origin, it's designed to perform image classification. For details about family
-  of octave convolution models, check out the repository <https://github.com/facebookresearch/OctConv>.
-
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  RGB order. The RGB mean values need to be subtracted as follows: [124,117,104]
-  before passing the image blob into the network. In addition, values must be
-  divided by 0.0167.
-
-  The model output for `octave-resnet-26-0.25` is the typical object classifier
-  output for the 1000 different classifications matching those in the ImageNet
-  database.
+  The "octave-resnet-26-0.25" model is a modification of "resnet-26" <https://arxiv.org/pdf/1512.03385.pdf>
+  with Octave convolutions from Drop an Octave: Reducing Spatial Redundancy in Convolutional
+  Neural Networks with Octave Convolution <https://arxiv.org/abs/1904.05049> with
+  "alpha=0.25". Like the original model, this model is designed for image classification.
+  For details about the family of Octave Convolution models, check out the repository
+  <https://github.com/facebookresearch/OctConv>.
 task_type: classification
 files:
   - name: a02_resnet-26_alpha-0.250.tar
@@ -46,6 +37,5 @@ model_optimizer_args:
   - --input=data
   - --output=softmax
   - --input_model=$dl_dir/a02_resnet-26_alpha-0.250/checkpoint-0-0000.params
-  - --input_symbol=$dl_dir/a02_resnet-26_alpha-0.250/checkpoint-0-symbol.json
 framework: mxnet
 license: https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE
diff --git a/models/public/octave-resnet-26-0.25/octave-resnet-26-0.25.md b/models/public/octave-resnet-26-0.25/octave-resnet-26-0.25.md
index ce171512bc8..7ad6f4d9361 100644
--- a/models/public/octave-resnet-26-0.25/octave-resnet-26-0.25.md
+++ b/models/public/octave-resnet-26-0.25/octave-resnet-26-0.25.md
@@ -67,4 +67,29 @@ Object classifier according to ImageNet classes, name: `prob`,  shape: `1,1000`,
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) Facebook, Inc. and its affiliates.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/octave-resnet-50-0.125/model.yml b/models/public/octave-resnet-50-0.125/model.yml
index fb28d3d658b..8728aaa63c9 100644
--- a/models/public/octave-resnet-50-0.125/model.yml
+++ b/models/public/octave-resnet-50-0.125/model.yml
@@ -13,21 +13,20 @@
 # limitations under the License.
 
 description: >-
-  The `octave-resnet-50-0.125` model is a modification of `resnet-50` from this
-  paper <https://arxiv.org/pdf/1512.03385.pdf> with octave convolutions from Drop
-  an Octave: Reducing Spatial Redundancy in Convolutional Neural Networks with
-  Octave Convolution <https://arxiv.org/abs/1904.05049> with `alpha=0.125`. As
-  origin, it's designed to perform image classification. For details about family
-  of octave convolution models, check out the repository <https://github.com/facebookresearch/OctConv>.
+  The "octave-resnet-50-0.125" model is a modification of "resnet-50" from this paper
+  <https://arxiv.org/pdf/1512.03385.pdf> with octave convolutions from Drop an Octave:
+  Reducing Spatial Redundancy in Convolutional Neural Networks with Octave Convolution
+  <https://arxiv.org/abs/1904.05049> with "alpha=0.125". The model is originally designed
+  for image classification. For details about the family of Octave Convolution models,
+  check out the repository <https://github.com/facebookresearch/OctConv>.
 
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  RGB order. The RGB mean values need to be subtracted as follows: [124,117,104]
-  before passing the image blob into the network. In addition, values must be
-  divided by 0.0167.
+  The model input is a blob that consists of a single image of 1x3x224x224 in RGB
+  order. The RGB mean values need to be subtracted as follows: [124,117,104] before
+  passing the image blob into the network. In addition, values must be divided by
+  0.0167.
 
-  The model output for `octave-resnet-50-0.125` is the typical object classifier
-  output for the 1000 different classifications matching those in the ImageNet
-  database.
+  The model output for "octave-resnet-50-0.125" is the typical object classifier output
+  for the 1000 different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: a03_resnet-50_alpha-0.125.tar
@@ -46,6 +45,5 @@ model_optimizer_args:
   - --input=data
   - --output=softmax
   - --input_model=$dl_dir/a03_resnet-50_alpha-0.125/checkpoint-0-0000.params
-  - --input_symbol=$dl_dir/a03_resnet-50_alpha-0.125/checkpoint-0-symbol.json
 framework: mxnet
 license: https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE
diff --git a/models/public/octave-resnet-50-0.125/octave-resnet-50-0.125.md b/models/public/octave-resnet-50-0.125/octave-resnet-50-0.125.md
index 2d987de7ddc..ed0f82f6265 100644
--- a/models/public/octave-resnet-50-0.125/octave-resnet-50-0.125.md
+++ b/models/public/octave-resnet-50-0.125/octave-resnet-50-0.125.md
@@ -66,4 +66,29 @@ Object classifier according to ImageNet classes, name: `prob`,  shape: `1,1000`,
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) Facebook, Inc. and its affiliates.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/octave-resnext-101-0.25/model.yml b/models/public/octave-resnext-101-0.25/model.yml
index 985c412b12a..23767efbb90 100644
--- a/models/public/octave-resnext-101-0.25/model.yml
+++ b/models/public/octave-resnext-101-0.25/model.yml
@@ -13,21 +13,12 @@
 # limitations under the License.
 
 description: >-
-  The `octave-resnext-101-0.25` model is a modification of `resnext-101` from
-  this paper <https://arxiv.org/abs/1611.05431> with octave convolutions from
-  Drop an Octave: Reducing Spatial Redundancy in Convolutional Neural Networks
-  with Octave Convolution <https://arxiv.org/abs/1904.05049> with `alpha=0.25`.
-  As origin, it's designed to perform image classification. For details about
-  family of octave convolution models, check out the repository <https://github.com/facebookresearch/OctConv>.
-
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  RGB order. The RGB mean values need to be subtracted as follows: [124,117,104]
-  before passing the image blob into the network. In addition, values must be
-  divided by 0.0167.
-
-  The model output for `octave-resnext-101-0.125` is the typical object classifier
-  output for the 1000 different classifications matching those in the ImageNet
-  database.
+  The "octave-resnext-101-0.25" model is a modification of "resnext-101" <https://arxiv.org/abs/1611.05431>
+  with Octave convolutions from Drop an Octave: Reducing Spatial Redundancy in Convolutional
+  Neural Networks with Octave Convolution <https://arxiv.org/abs/1904.05049> with
+  "alpha=0.25". Like the original model, this model is designed for image classification.
+  For details about the family of Octave Convolution models, check out the repository
+  <https://github.com/facebookresearch/OctConv>.
 task_type: classification
 files:
   - name: a07_resnext-101_32x4d_alpha-0.250.tar
@@ -46,6 +37,5 @@ model_optimizer_args:
   - --input=data
   - --output=softmax
   - --input_model=$dl_dir/a07_resnext-101_32x4d_alpha-0.250/checkpoint-0-0000.params
-  - --input_symbol=$dl_dir/a07_resnext-101_32x4d_alpha-0.250/checkpoint-0-symbol.json
 framework: mxnet
 license: https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE
diff --git a/models/public/octave-resnext-101-0.25/octave-resnext-101-0.25.md b/models/public/octave-resnext-101-0.25/octave-resnext-101-0.25.md
index b1f4fa062a5..f0080a01cae 100644
--- a/models/public/octave-resnext-101-0.25/octave-resnext-101-0.25.md
+++ b/models/public/octave-resnext-101-0.25/octave-resnext-101-0.25.md
@@ -66,4 +66,29 @@ Object classifier according to ImageNet classes, name: `prob`,  shape: `1,1000`,
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) Facebook, Inc. and its affiliates.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/octave-resnext-50-0.25/model.yml b/models/public/octave-resnext-50-0.25/model.yml
index 6faf4c207ef..65c174f1c1e 100644
--- a/models/public/octave-resnext-50-0.25/model.yml
+++ b/models/public/octave-resnext-50-0.25/model.yml
@@ -13,21 +13,12 @@
 # limitations under the License.
 
 description: >-
-  The `octave-resnext-50-0.25` model is a modification of `resnext-50` from this
-  paper <https://arxiv.org/abs/1611.05431> with octave convolutions from Drop
-  an Octave: Reducing Spatial Redundancy in Convolutional Neural Networks with
-  Octave Convolution <https://arxiv.org/abs/1904.05049> with `alpha=0.25`. As
-  origin, it's designed to perform image classification. For details about family
-  of octave convolution models, check out the repository <https://github.com/facebookresearch/OctConv>.
-
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  RGB order. The RGB mean values need to be subtracted as follows: [124,117,104]
-  before passing the image blob into the network. In addition, values must be
-  divided by 0.0167.
-
-  The model output for `octave-resnext-50-0.125` is the typical object classifier
-  output for the 1000 different classifications matching those in the ImageNet
-  database.
+  The "octave-resnext-50-0.25" model is a modification of "resnext-50" <https://arxiv.org/abs/1611.05431>
+  with Octave convolutions from Drop an Octave: Reducing Spatial Redundancy in Convolutional
+  Neural Networks with Octave Convolution <https://arxiv.org/abs/1904.05049> with
+  "alpha=0.25". Like the original model, this model is designed for image classification.
+  For details about the family of Octave Convolution models, check out the repository
+  <https://github.com/facebookresearch/OctConv>.
 task_type: classification
 files:
   - name: a04_resnext-50_32x4d_alpha-0.250.tar
@@ -46,6 +37,5 @@ model_optimizer_args:
   - --input=data
   - --output=softmax
   - --input_model=$dl_dir/a04_resnext-50_32x4d_alpha-0.250/checkpoint-0-0000.params
-  - --input_symbol=$dl_dir/a04_resnext-50_32x4d_alpha-0.250/checkpoint-0-symbol.json
 framework: mxnet
 license: https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE
diff --git a/models/public/octave-resnext-50-0.25/octave-resnext-50-0.25.md b/models/public/octave-resnext-50-0.25/octave-resnext-50-0.25.md
index 17d3c372eef..57cc0f733e0 100644
--- a/models/public/octave-resnext-50-0.25/octave-resnext-50-0.25.md
+++ b/models/public/octave-resnext-50-0.25/octave-resnext-50-0.25.md
@@ -66,4 +66,29 @@ Object classifier according to ImageNet classes, name: `prob`,  shape: `1,1000`,
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) Facebook, Inc. and its affiliates.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/octave-se-resnet-50-0.125/model.yml b/models/public/octave-se-resnet-50-0.125/model.yml
index af2404a321b..f1cec1283f3 100644
--- a/models/public/octave-se-resnet-50-0.125/model.yml
+++ b/models/public/octave-se-resnet-50-0.125/model.yml
@@ -13,21 +13,20 @@
 # limitations under the License.
 
 description: >-
-  The `octave-se-resnet-50-0.125` model is a modification of `se-resnet-50` from this
-  paper <https://arxiv.org/pdf/1512.03385.pdf> with octave convolutions from Drop
-  an Octave: Reducing Spatial Redundancy in Convolutional Neural Networks with
-  Octave Convolution <https://arxiv.org/abs/1904.05049> with `alpha=0.125`. As
-  origin, it's designed to perform image classification. For details about family
-  of octave convolution models, check out the repository <https://github.com/facebookresearch/OctConv>.
+  The "octave-se-resnet-50-0.125" model is a modification of "se-resnet-50" from this
+  paper <https://arxiv.org/pdf/1709.01507.pdf> with octave convolutions from Drop
+  an Octave: Reducing Spatial Redundancy in Convolutional Neural Networks with Octave
+  Convolution <https://arxiv.org/abs/1904.05049> with "alpha=0.125". Like the original
+  model, it is designed to perform image classification. For details about the family of octave convolution
+  models, check out the repository <https://github.com/facebookresearch/OctConv>.
 
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  RGB order. The RGB mean values need to be subtracted as follows: [124,117,104]
-  before passing the image blob into the network. In addition, values must be
-  divided by 0.0167.
+  The model input is a blob that consists of a single image of 1x3x224x224 in RGB
+  order. The RGB mean values need to be subtracted as follows: [124,117,104] before
+  passing the image blob into the network. In addition, values must be divided by
+  0.0167.
 
-  The model output for `octave-se-resnet-50-0.125` is the typical object classifier
-  output for the 1000 different classifications matching those in the ImageNet
-  database.
+  The model output for "octave-se-resnet-50-0.125" is the typical object classifier
+  output for the 1000 different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: a05_se-resnet-50_alpha-0.125.tar
@@ -46,6 +45,5 @@ model_optimizer_args:
   - --input=data
   - --output=softmax
   - --input_model=$dl_dir/a05_se-resnet-50_alpha-0.125/checkpoint-0-0000.params
-  - --input_symbol=$dl_dir/a05_se-resnet-50_alpha-0.125/checkpoint-0-symbol.json
 framework: mxnet
 license: https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE
diff --git a/models/public/octave-se-resnet-50-0.125/octave-se-resnet-50-0.125.md b/models/public/octave-se-resnet-50-0.125/octave-se-resnet-50-0.125.md
index b26d2e0a9d0..4128f34056f 100644
--- a/models/public/octave-se-resnet-50-0.125/octave-se-resnet-50-0.125.md
+++ b/models/public/octave-se-resnet-50-0.125/octave-se-resnet-50-0.125.md
@@ -66,4 +66,29 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/facebookresearch/OctConv/master/LICENSE):
+
+```
+MIT License
+
+Copyright (c) Facebook, Inc. and its affiliates.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/resnet-101/resnet-101.md b/models/public/resnet-101/resnet-101.md
index 30a2c39e35c..abaf012a085 100644
--- a/models/public/resnet-101/resnet-101.md
+++ b/models/public/resnet-101/resnet-101.md
@@ -62,4 +62,29 @@ Object classifier according to ImageNet classes, name: `prob`,  shape: `1,1000`,
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/KaimingHe/deep-residual-networks/master/LICENSE)
\ No newline at end of file
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/KaimingHe/deep-residual-networks/master/LICENSE):
+
+```
+The MIT License (MIT)
+
+Copyright (c) 2016 Shaoqing Ren
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/resnet-152/resnet-152.md b/models/public/resnet-152/resnet-152.md
index e9a6a69c0e0..b86c4cb36c2 100644
--- a/models/public/resnet-152/resnet-152.md
+++ b/models/public/resnet-152/resnet-152.md
@@ -64,4 +64,29 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/KaimingHe/deep-residual-networks/master/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/KaimingHe/deep-residual-networks/master/LICENSE):
+
+```
+The MIT License (MIT)
+
+Copyright (c) 2016 Shaoqing Ren
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/resnet-18-pytorch/model.yml b/models/public/resnet-18-pytorch/model.yml
new file mode 100644
index 00000000000..5a38a34c37f
--- /dev/null
+++ b/models/public/resnet-18-pytorch/model.yml
@@ -0,0 +1,48 @@
+# Copyright (c) 2020 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  ResNet 18 is an image classification model pretrained on the ImageNet dataset. This
+  is a PyTorch implementation based on the architecture described in the paper "Deep Residual
+  Learning for Image Recognition" <https://arxiv.org/pdf/1512.03385> in the TorchVision
+  package (see here <https://github.com/pytorch/vision>).
+
+  The model input is a blob that consists of a single image of "1x3x224x224" in
+  RGB order.
+
+  The model output is a typical object classifier output for the 1000 different classifications
+  matching those in the ImageNet database.
+task_type: classification
+files:
+  - name: resnet18-5c106cde.pth
+    sha256: 5c106cde386e87d4033832f2996f5493238eda96ccf559d1d62760c4de0613f8
+    size: 46827520
+    source: https://download.pytorch.org/models/resnet18-5c106cde.pth
+framework: pytorch
+conversion_to_onnx_args:
+  - --model-name=resnet18
+  - --weights=$dl_dir/resnet18-5c106cde.pth
+  - --from-torchvision
+  - --input-shape=1,3,224,224
+  - --output-file=$conv_dir/resnet-18-pytorch.onnx
+  - --input-names=data
+  - --output-names=prob
+model_optimizer_args:
+  - --input=data
+  - --mean_values=data[123.675,116.28,103.53]
+  - --scale_values=data[58.395,57.12,57.375]
+  - --reverse_input_channels
+  - --output=prob
+  - --input_model=$conv_dir/resnet-18-pytorch.onnx
+license: https://raw.githubusercontent.com/pytorch/vision/master/LICENSE
diff --git a/models/public/resnet-18-pytorch/resnet-18-pytorch.md b/models/public/resnet-18-pytorch/resnet-18-pytorch.md
new file mode 100644
index 00000000000..6e110142c6f
--- /dev/null
+++ b/models/public/resnet-18-pytorch/resnet-18-pytorch.md
@@ -0,0 +1,107 @@
+# resnet-18-pytorch
+
+## Use Case and High-Level Description
+
+ResNet 18 is an image classification model pretrained on the ImageNet dataset. This
+is a PyTorch implementation based on the architecture described in the paper ["Deep Residual
+Learning for Image Recognition"](https://arxiv.org/pdf/1512.03385) in the TorchVision
+package (see [here](https://github.com/pytorch/vision)).
+
+The model input is a blob that consists of a single image of "1x3x224x224"
+in RGB order.
+
+The model output is a typical object classifier output for the 1000 different classifications
+matching those in the ImageNet database.
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 3.637         |
+| MParams           | 11.68         |
+| Source framework  | PyTorch\*     |
+
+## Accuracy
+
+## Performance
+
+## Input
+
+### Original model
+
+Image, name - `data`,  shape - `1,3,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `RGB`. 
+Mean values - [123.675,116.28,103.53], scale values - [58.395,57.12,57.375].
+
+### Converted model
+
+Image, name - `data`,  shape - `1,3,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+
+## Output
+
+### Original model
+
+Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - Predicted probabilities for each class in the [0, 1] range
+
+### Converted model
+
+Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - Predicted probabilities for each class in the [0, 1] range
+
+## Legal Information
+
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/pytorch/vision/master/LICENSE):
+
+```
+BSD 3-Clause License
+
+Copyright (c) Soumith Chintala 2016,
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+
+* Redistributions of source code must retain the above copyright notice, this
+  list of conditions and the following disclaimer.
+
+* Redistributions in binary form must reproduce the above copyright notice,
+  this list of conditions and the following disclaimer in the documentation
+  and/or other materials provided with the distribution.
+
+* Neither the name of the copyright holder nor the names of its
+  contributors may be used to endorse or promote products derived from
+  this software without specific prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
+FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
+SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/resnet-50-caffe2/model.yml b/models/public/resnet-50-caffe2/model.yml
new file mode 100644
index 00000000000..80c361e3efe
--- /dev/null
+++ b/models/public/resnet-50-caffe2/model.yml
@@ -0,0 +1,43 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  This is a Caffe2* version of "resnet-50" model, designed to perform image classification.
+  This model was converted from Caffe* to Caffe2* format.  For details see repository
+  <https://github.com/caffe2/models/tree/master/resnet50>, paper <https://arxiv.org/pdf/1512.03385.pdf>.
+task_type: classification
+files:
+  - name: predict_net.pb
+    size: 31649
+    sha256: 657081428cd8a8d9f1a6b20a8b6dba51725d3fc1eaabf0f19747a3b843e18a16
+    source: https://s3.amazonaws.com/download.caffe2.ai/models/resnet50/predict_net.pb
+  - name: init_net.pb
+    size: 128070759
+    sha256: 97046c44ecd15b3c8806f609a15d0cc52af7bdc8aa19c720f8a1f6abe68e9a74
+    source: https://s3.amazonaws.com/download.caffe2.ai/models/resnet50/init_net.pb
+framework: caffe2
+conversion_to_onnx_args:
+  - --model-path=$dl_dir/predict_net.pb
+  - --model-name=resnet-50-caffe2
+  - --weights=$dl_dir/init_net.pb
+  - --input-shape=1,3,224,224
+  - --input-names=gpu_0/data
+  - --output-file=$conv_dir/resnet-50-caffe2.onnx
+model_optimizer_args:
+  - --input_shape=[1,3,224,224]
+  - --input=gpu_0/data
+  - --mean_values=gpu_0/data[103.53,116.28,123.675]
+  - --scale_values=gpu_0/data[57.375,57.12,58.395]
+  - --input_model=$conv_dir/resnet-50-caffe2.onnx
+license: https://raw.githubusercontent.com/caffe2/models/master/LICENSE
diff --git a/models/public/resnet-50-caffe2/resnet-50-caffe2.md b/models/public/resnet-50-caffe2/resnet-50-caffe2.md
new file mode 100644
index 00000000000..5d928735f54
--- /dev/null
+++ b/models/public/resnet-50-caffe2/resnet-50-caffe2.md
@@ -0,0 +1,70 @@
+# resnet-50-caffe2
+
+## Use Case and High-Level Description
+
+This is a Caffe2\* version of `resnet-50` model, designed to perform image classification.
+This model was converted from Caffe\* to Caffe2\* format. 
+For details see repository <https://github.com/caffe2/models/tree/master/resnet50>,
+paper <https://arxiv.org/pdf/1512.03385.pdf>.
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 8.216         |
+| MParams           | 25.53         |
+| Source framework  | Caffe2\*      |
+
+## Accuracy
+
+## Performance
+
+## Input
+
+### Original model
+
+Image, name - `gpu_0/data`,  shape - `1,3,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`. 
+Mean values - [103.53,116.28,123.675], scale values - [57.375,57.12,58.395].
+
+### Converted model
+
+Image, name - `gpu_0/data`,  shape - `1,3,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+
+## Output
+
+### Original model
+
+Object classifier according to ImageNet classes, name - `gpu_0/softmax`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in  [0, 1] range
+
+### Converted model
+
+Object classifier according to ImageNet classes, name - `gpu_0/softmax`,  shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in  [0, 1] range
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/caffe2/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0.txt](../licenses/APACHE-2.0.txt).
diff --git a/models/public/resnet-50-pytorch/model.yml b/models/public/resnet-50-pytorch/model.yml
index 1c8bc24c6a4..64a35ba355c 100644
--- a/models/public/resnet-50-pytorch/model.yml
+++ b/models/public/resnet-50-pytorch/model.yml
@@ -13,13 +13,13 @@
 # limitations under the License.
 
 description: >-
-  Resnet 50 is image classification model pretrained on ImageNet dataset. This
-  is PyTorch implementation based on architecture described in paper "Deep Residual
-  Learning for Image Recognition" <https://arxiv.org/pdf/1512.03385> in TorchVision
-  package (see here <https://github.com/pytorch/vision>).
+  Resnet 50 is image classification model pretrained on ImageNet dataset. This is
+  PyTorch implementation based on architecture described in paper "Deep Residual Learning
+  for Image Recognition" <https://arxiv.org/pdf/1512.03385> in TorchVision package
+  (see here <https://github.com/pytorch/vision>).
 
-  The model input is a blob that consists of a single image of "1x3x224x224" in
-  RGB order.
+  The model input is a blob that consists of a single image of "1x3x224x224" in RGB
+  order. 
 
   The model output is typical object classifier for the 1000 different classifications
   matching with those in the ImageNet database.
@@ -30,7 +30,7 @@ files:
     size: 102502400
     source: https://download.pytorch.org/models/resnet50-19c8e357.pth
 framework: pytorch
-pytorch_to_onnx:
+conversion_to_onnx_args:
   - --model-name=resnet50
   - --weights=$dl_dir/resnet50-19c8e357.pth
   - --from-torchvision
diff --git a/models/public/resnet-50-pytorch/resnet-50-pytorch.md b/models/public/resnet-50-pytorch/resnet-50-pytorch.md
index 56167b3231e..4c0fc2a0527 100644
--- a/models/public/resnet-50-pytorch/resnet-50-pytorch.md
+++ b/models/public/resnet-50-pytorch/resnet-50-pytorch.md
@@ -71,4 +71,37 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/pytorch/vision/master/LICENSE)
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/pytorch/vision/master/LICENSE):
+
+```
+BSD 3-Clause License
+
+Copyright (c) Soumith Chintala 2016,
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+
+* Redistributions of source code must retain the above copyright notice, this
+  list of conditions and the following disclaimer.
+
+* Redistributions in binary form must reproduce the above copyright notice,
+  this list of conditions and the following disclaimer in the documentation
+  and/or other materials provided with the distribution.
+
+* Neither the name of the copyright holder nor the names of its
+  contributors may be used to endorse or promote products derived from
+  this software without specific prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
+FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
+SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/resnet-50-tf/freeze_saved_model.py b/models/public/resnet-50-tf/freeze_saved_model.py
new file mode 100644
index 00000000000..c6a3452e54a
--- /dev/null
+++ b/models/public/resnet-50-tf/freeze_saved_model.py
@@ -0,0 +1,43 @@
+import argparse
+import tensorflow.compat.v1 as tf
+
+from tensorflow.python.framework import graph_io
+from tensorflow.python.tools import optimize_for_inference_lib
+
+def parse_args():  # Build the command-line parser and return the parsed arguments.
+    """Parse input arguments"""
+
+    parser = argparse.ArgumentParser(description='Freeze saved model')
+
+    parser.add_argument('--saved_model_dir', type=str, required=True,  # mandatory: where to read the model from
+                        help='Path to saved model directory.')
+    parser.add_argument('--save_file', type=str, required=True,  # mandatory: where to write the frozen model
+                        help='Path to resulting frozen model.')
+    return parser.parse_args()  # namespace exposing .saved_model_dir and .save_file
+
+def freeze(saved_model_dir, input_nodes, output_nodes, save_file):  # Load a saved model, freeze and optimize it, write it to save_file.
+    graph_def = tf.Graph()  # NOTE: despite the name, this is a tf.Graph object, not a GraphDef
+    with tf.Session(graph=graph_def) as sess:
+        tf.saved_model.loader.load(sess, [tf.saved_model.tag_constants.SERVING], saved_model_dir)  # load the SERVING-tagged model into sess
+        frozen_graph_def = tf.graph_util.convert_variables_to_constants(  # variables -> constants for output_nodes (see TF API docs)
+            sess,
+            sess.graph_def,
+            output_nodes
+        )
+        frozen_graph_def = optimize_for_inference_lib.optimize_for_inference(  # rebinds the name to the optimized graph
+            frozen_graph_def,
+            input_nodes,
+            output_nodes,
+            tf.float32.as_datatype_enum  # presumably the placeholder dtype enum for input_nodes - confirm against TF docs
+        )
+        with open(save_file, 'wb') as f:  # binary mode: the serialized graph is written as-is
+            f.write(frozen_graph_def.SerializeToString())
+
+def main():  # Script entry point: freeze the saved model using fixed input/output node names.
+    args = parse_args()
+    input_nodes = ['map/TensorArrayStack/TensorArrayGatherV3']  # hard-coded; same name as --input in this model's model.yml
+    output_nodes = ['softmax_tensor']  # hard-coded; same name as --output in this model's model.yml
+    freeze(args.saved_model_dir, input_nodes, output_nodes, args.save_file)
+
+if __name__ == '__main__':  # run only when executed as a script, not on import
+    main()
diff --git a/models/public/resnet-50-tf/model.yml b/models/public/resnet-50-tf/model.yml
new file mode 100644
index 00000000000..0838075152d
--- /dev/null
+++ b/models/public/resnet-50-tf/model.yml
@@ -0,0 +1,33 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  resnet-50-tf is a TensorFlow* implementation of ResNet-50 - an image classification model
+  pretrained on the ImageNet dataset. For details see paper <https://arxiv.org/pdf/1512.03385.pdf>,
+  repository <https://github.com/tensorflow/models/tree/master/official/r1/resnet>.
+task_type: classification
+files:
+  - name: resnet_v1-50.pb
+    size: 102170160
+    sha256: 7c186a471a30682cdee02b246eeb0bfd93fc71d9fa53834d69f8101e664d12f8
+    source: https://download.01.org/opencv/public_models/012020/resnet-50-tf/resnet_v1-50.pb
+model_optimizer_args:
+  - --input_shape=[1,224,224,3]
+  - --mean_values=[123.68,116.78,103.94]
+  - --input=map/TensorArrayStack/TensorArrayGatherV3
+  - --output=softmax_tensor
+  - --input_model=$dl_dir/resnet_v1-50.pb
+  - --reverse_input_channels
+framework: tf
+license: https://raw.githubusercontent.com/tensorflow/models/master/LICENSE
diff --git a/models/public/resnet-50-tf/resnet-50-tf.md b/models/public/resnet-50-tf/resnet-50-tf.md
new file mode 100644
index 00000000000..7717b6a7206
--- /dev/null
+++ b/models/public/resnet-50-tf/resnet-50-tf.md
@@ -0,0 +1,85 @@
+# resnet-50-tf
+
+## Use Case and High-Level Description
+
+`resnet-50-tf` is a TensorFlow\* implementation of ResNet-50 - an image classification model
+pretrained on the ImageNet dataset. The model was originally distributed in the SavedModel
+format and was converted to a frozen graph using the `tf.graph_util` module.
+For details see [paper](https://arxiv.org/pdf/1512.03385.pdf),
+[repository](https://github.com/tensorflow/models/tree/master/official/r1/resnet).
+
+### Steps to Reproduce Conversion to Frozen Graph
+
+1. Install TensorFlow\*, version 1.14.0.
+2. Download [pretrained weights](http://download.tensorflow.org/models/official/20181001_resnet/savedmodels/resnet_v1_fp32_savedmodel_NHWC_jpg.tar.gz).
+3. Run example conversion code, available at [freeze_saved_model.py](./freeze_saved_model.py):
+```sh
+python3 freeze_saved_model.py --saved_model_dir path/to/downloaded/saved_model --save_file path/to/resulting/frozen_graph.pb
+```
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 8.2164        |
+| MParams           | 25.53         |
+| Source framework  | TensorFlow\*  |
+
+## Accuracy
+
+| Metric | Original model | Converted model |
+| ------ | -------------- | --------------- |
+| Top 1  | 76.45          | 76.17           |
+| Top 5  | 93.05          | 92.98           |
+
+## Performance
+
+## Input
+
+### Original Model
+
+Image, name: `map/TensorArrayStack/TensorArrayGatherV3`,  shape: `1,224,224,3`, format is `B,H,W,C` where:
+
+- `B` - batch size
+- `H` - height
+- `W` - width
+- `C` - channel
+
+Channel order is `RGB`. 
+Mean values: [123.68,116.78,103.94].
+
+### Converted Model
+
+Image, name: `map/TensorArrayStack/TensorArrayGatherV3`,  shape: `1,224,224,3`, format is `B,H,W,C` where:
+
+- `B` - batch size
+- `H` - height
+- `W` - width
+- `C` - channel
+
+Channel order is `BGR`.
+
+## Output
+
+### Original Model
+
+Object classifier according to ImageNet classes, name: `softmax_tensor`,  shape: `1,1001`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in  [0, 1] range
+
+### Converted Model
+
+Object classifier according to ImageNet classes, name: `softmax_tensor`,  shape: `1,1001`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in  [0, 1] range
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/resnet-50/resnet-50.md b/models/public/resnet-50/resnet-50.md
index 3b59ea56509..d445e0e126e 100644
--- a/models/public/resnet-50/resnet-50.md
+++ b/models/public/resnet-50/resnet-50.md
@@ -62,4 +62,29 @@ Object classifier according to ImageNet classes, name: `prob`,  shape: `1,1000`,
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/KaimingHe/deep-residual-networks/master/LICENSE)
\ No newline at end of file
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/KaimingHe/deep-residual-networks/master/LICENSE):
+
+```
+The MIT License (MIT)
+
+Copyright (c) 2016 Shaoqing Ren
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+```
diff --git a/models/public/rfcn-resnet101-coco-tf/model.yml b/models/public/rfcn-resnet101-coco-tf/model.yml
new file mode 100644
index 00000000000..6d29437a9c5
--- /dev/null
+++ b/models/public/rfcn-resnet101-coco-tf/model.yml
@@ -0,0 +1,37 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  R-FCN Resnet-101 model, pretrained on COCO* dataset. Used for object detection.
+  For details, see the paper <https://arxiv.org/pdf/1605.06409.pdf>.
+task_type: detection
+files:
+  - name: rfcn_resnet101_coco_2018_01_28.tar.gz
+    size: 652955004
+    sha256: e10d71260515cc0240d53ea8fc9e61669bc10c2df5e67ace682832113ac17205
+    source: http://download.tensorflow.org/models/object_detection/rfcn_resnet101_coco_2018_01_28.tar.gz
+postprocessing:
+  - $type: unpack_archive
+    format: gztar
+    file: rfcn_resnet101_coco_2018_01_28.tar.gz
+model_optimizer_args:
+  - --reverse_input_channels
+  - --input_shape=[1,600,600,3]
+  - --input=image_tensor
+  - --output=detection_scores,detection_boxes,num_detections
+  - --transformations_config=$mo_dir/extensions/front/tf/rfcn_support.json
+  - --tensorflow_object_detection_api_pipeline_config=$dl_dir/rfcn_resnet101_coco_2018_01_28/pipeline.config
+  - --input_model=$dl_dir/rfcn_resnet101_coco_2018_01_28/frozen_inference_graph.pb
+framework: tf
+license: https://raw.githubusercontent.com/tensorflow/models/master/LICENSE
diff --git a/models/public/rfcn-resnet101-coco-tf/rfcn-resnet101-coco-tf.md b/models/public/rfcn-resnet101-coco-tf/rfcn-resnet101-coco-tf.md
new file mode 100644
index 00000000000..d3384a67bcf
--- /dev/null
+++ b/models/public/rfcn-resnet101-coco-tf/rfcn-resnet101-coco-tf.md
@@ -0,0 +1,78 @@
+# rfcn-resnet101-coco-tf
+
+## Use Case and High-Level Description
+
+R-FCN Resnet-101 model, pretrained on COCO\* dataset. Used for object detection. For details, see the [paper](https://arxiv.org/pdf/1605.06409.pdf).
+
+## Example
+
+## Specification
+
+| Metric                          | Value                                     |
+|---------------------------------|-------------------------------------------|
+| Type                            | Object detection                          |
+| GFlops                          | 53.462                                    |
+| MParams                         | 171.85                                    |
+| Source framework                | TensorFlow\*                              |
+
+## Performance
+
+## Input
+
+### Original Model
+
+Image, name: `image_tensor`, shape: [1x600x600x3], format: [BxHxWxC],
+   where:
+
+    - B - batch size
+    - H - image height
+    - W - image width
+    - C - number of channels
+
+   Expected color order: RGB.
+
+### Converted Model
+
+1. Image, name: `image_tensor`, shape: [1x3x600x600], format: [BxCxHxW],
+   where:
+
+    - B - batch size
+    - C - number of channels
+    - H - image height
+    - W - image width
+
+   Expected color order: BGR.
+
+2. Information of input image size, name: `image_info`, shape: [1x3], format: [BxC],
+   where:
+
+    - B - batch size
+    - C - vector of 3 values in format [H,W,S], where H is an image height, W is an image width, S is an image scale factor (usually 1)
+
+## Output
+
+### Original Model
+
+1. Classifier, name: `detection_classes`. Contains predicted bounding boxes classes in a range [1, 91]. The model was trained on the Microsoft\* COCO dataset version with 90 categories of objects.
+2. Probability, name: `detection_scores`. Contains probability of detected bounding boxes.
+3. Detection box, name: `detection_boxes`. Contains detection boxes coordinates in a format `[y_min, x_min, y_max, x_max]`, where (`x_min`, `y_min`)  are coordinates of the top left corner, (`x_max`, `y_max`) are coordinates of the right bottom corner. Coordinates are rescaled to input image size.
+4. Detections number, name: `num_detections`. Contains the number of predicted detection boxes.
+
+### Converted Model
+
+The array of summary detection information, name: `detection_output`, shape: [1, 1, N, 7], where N is the number of detected
+bounding boxes. For each detection, the description has the format:
+[`image_id`, `label`, `conf`, `x_min`, `y_min`, `x_max`, `y_max`],
+    where:
+
+    - `image_id` - ID of the image in the batch
+    - `label` - predicted class ID
+    - `conf` - confidence for the predicted class
+    - (`x_min`, `y_min`) - coordinates of the top left bounding box corner (coordinates stored in normalized format, in range [0, 1])
+    - (`x_max`, `y_max`) - coordinates of the bottom right bounding box corner  (coordinates stored in normalized format, in range [0, 1])
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/se-inception/se-inception.md b/models/public/se-inception/se-inception.md
index a5d9ff39525..377cf879df3 100644
--- a/models/public/se-inception/se-inception.md
+++ b/models/public/se-inception/se-inception.md
@@ -62,4 +62,6 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/hujie-frank/SENet/master/LICENSE)
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/hujie-frank/SENet/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-SENet.txt](../licenses/APACHE-2.0-SENet.txt).
diff --git a/models/public/se-resnet-101/se-resnet-101.md b/models/public/se-resnet-101/se-resnet-101.md
index a1b7bd5ac3d..9dc313dd7c6 100644
--- a/models/public/se-resnet-101/se-resnet-101.md
+++ b/models/public/se-resnet-101/se-resnet-101.md
@@ -62,4 +62,6 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/hujie-frank/SENet/master/LICENSE)
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/hujie-frank/SENet/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-SENet.txt](../licenses/APACHE-2.0-SENet.txt).
diff --git a/models/public/se-resnet-152/se-resnet-152.md b/models/public/se-resnet-152/se-resnet-152.md
index b4af9e0f96e..4e1d3c2ab66 100644
--- a/models/public/se-resnet-152/se-resnet-152.md
+++ b/models/public/se-resnet-152/se-resnet-152.md
@@ -62,4 +62,6 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/hujie-frank/SENet/master/LICENSE)
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/hujie-frank/SENet/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-SENet.txt](../licenses/APACHE-2.0-SENet.txt).
diff --git a/models/public/se-resnet-50/se-resnet-50.md b/models/public/se-resnet-50/se-resnet-50.md
index a267c735d55..5c121bfddfd 100644
--- a/models/public/se-resnet-50/se-resnet-50.md
+++ b/models/public/se-resnet-50/se-resnet-50.md
@@ -62,4 +62,6 @@ Object classifier according to ImageNet classes, name: `prob`,  shape: `1,1000`,
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/hujie-frank/SENet/master/LICENSE)
\ No newline at end of file
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/hujie-frank/SENet/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-SENet.txt](../licenses/APACHE-2.0-SENet.txt).
diff --git a/models/public/se-resnext-101/se-resnext-101.md b/models/public/se-resnext-101/se-resnext-101.md
index 33fc139fe18..b9e0e8892ed 100644
--- a/models/public/se-resnext-101/se-resnext-101.md
+++ b/models/public/se-resnext-101/se-resnext-101.md
@@ -62,4 +62,6 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/hujie-frank/SENet/master/LICENSE)
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/hujie-frank/SENet/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-SENet.txt](../licenses/APACHE-2.0-SENet.txt).
diff --git a/models/public/se-resnext-50/se-resnext-50.md b/models/public/se-resnext-50/se-resnext-50.md
index c8a4d794165..b2c8f0899c4 100644
--- a/models/public/se-resnext-50/se-resnext-50.md
+++ b/models/public/se-resnext-50/se-resnext-50.md
@@ -62,4 +62,6 @@ Object classifier according to ImageNet classes, name - `prob`,  shape - `1,1000
 
 ## Legal Information
 
-[LICENSE](https://raw.githubusercontent.com/hujie-frank/SENet/master/LICENSE)
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/hujie-frank/SENet/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-SENet.txt](../licenses/APACHE-2.0-SENet.txt).
diff --git a/models/public/single-human-pose-estimation-0001/description/single-human-pose-estimation-0001.md b/models/public/single-human-pose-estimation-0001/description/single-human-pose-estimation-0001.md
new file mode 100644
index 00000000000..9689f62e8f5
--- /dev/null
+++ b/models/public/single-human-pose-estimation-0001/description/single-human-pose-estimation-0001.md
@@ -0,0 +1,58 @@
+# single-human-pose-estimation-0001
+
+## Use Case and High-Level Description
+Single human pose estimation model based on https://arxiv.org/pdf/1906.04104.pdf.
+
+## Specification
+
+| Metric                                                        | Value                   |
+|---------------------------------------------------------------|-------------------------|
+| AP(coco orig)                                                 | 68                      |
+| GFlops                                                        | 60.125                  |
+| MParams                                                       | 33.165                  |
+| Source framework                                              | PyTorch\*               |
+
+
+## Inputs
+
+### Original model
+
+Name: "data" , shape: [1x3x384x288] - An input image in the format [BxCxHxW],
+   where:
+
+    - B - batch size
+    - C - number of channels
+    - H - image height
+    - W - image width
+
+   Expected color order - RGB. Mean values - [123.675,116.28,103.53]. Scale values - [58.395,57.12,57.375]
+
+### Converted model
+
+Name: "data" , shape: [1x3x384x288] - An input image in the format [BxCxHxW],
+   where:
+
+    - B - batch size
+    - C - number of channels
+    - H - image height
+    - W - image width
+
+   Expected color order - BGR.
+
+## Outputs
+
+### Original model
+
+The net outputs a list of 6 tensors, each of shape [1x17x48x36] (one heatmap per keypoint). All six outputs are needed to calculate the loss during training, but only the last output is used to obtain and postprocess the prediction results. Each subsequent tensor gives more accurate predictions (in terms of the AP metric).
+
+
+### Converted model
+
+The net outputs a tensor of shape [1x17x48x36] (one heatmap per keypoint).
+
+## Legal Information
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/opencv/openvino_training_extensions/develop/LICENSE).
+A copy of the license is provided in [APACHE-2.0.txt](../../licenses/APACHE-2.0.txt).
+
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/public/single-human-pose-estimation-0001/model.yml b/models/public/single-human-pose-estimation-0001/model.yml
new file mode 100644
index 00000000000..015b363c612
--- /dev/null
+++ b/models/public/single-human-pose-estimation-0001/model.yml
@@ -0,0 +1,45 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  Single human pose estimation model based on https://arxiv.org/pdf/1906.04104.pdf.
+task_type: human_pose_estimation
+files:
+  - name: single-human-pose-estimation-0001.tar.gz
+    sha256: 182c51075502643ada303a5f3a081b6adf943b711e5eddf80635582369588d34
+    size: 151979155
+    source: https://download.01.org/opencv/openvino_training_extensions/models/human_pose_estimation/single-human-pose-estimation-0001.tar.gz
+postprocessing:
+  - $type: unpack_archive
+    format: gztar
+    file: single-human-pose-estimation-0001.tar.gz
+framework: pytorch
+conversion_to_onnx_args:
+  - --model-path=$dl_dir/single-human-pose-estimation-0001/
+  - --model-name=SinglePersonPoseEstimationWithMobileNet
+  - --import-module=models
+  - --weights=$dl_dir/single-human-pose-estimation-0001/single-human-pose-estimation-0001.pth
+  - --input-shape=1,3,384,288
+  - --input-names=data
+  - --output-names=heatmaps0,heatmaps1,heatmaps2,heatmaps3,heatmaps4,heatmaps
+  - --output-file=$conv_dir/single-human-pose-estimation-0001.onnx
+model_optimizer_args:
+  - --input=data
+  - --mean_values=data[123.675,116.28,103.53]
+  - --scale_values=data[58.395,57.12,57.375]
+  - --output=heatmaps
+  - --input_model=$conv_dir/single-human-pose-estimation-0001.onnx
+  - --reverse_input_channels
+  - --input_shape=[1,3,384,288]
+license: https://raw.githubusercontent.com/opencv/openvino_training_extensions/develop/LICENSE
diff --git a/models/public/squeezenet1.0/model.yml b/models/public/squeezenet1.0/model.yml
index 685693f8752..6125f1a0e6f 100644
--- a/models/public/squeezenet1.0/model.yml
+++ b/models/public/squeezenet1.0/model.yml
@@ -13,17 +13,17 @@
 # limitations under the License.
 
 description: >-
-  The `squeezenet1.0` model is one of the SqueezeNet <https://arxiv.org/pdf/1602.07360>
-  topology models, is designed to perform image classification. The SqueezeNet
-  models have been pre-trained on the ImageNet image database. For details about
-  this family of models, check out the repository <https://github.com/DeepScale/SqueezeNet>.
+  The "squeezenet1.0" model is one of the SqueezeNet <https://arxiv.org/pdf/1602.07360>
+  topology models, is designed to perform image classification. The SqueezeNet models
+  have been pre-trained on the ImageNet image database. For details about this family
+  of models, check out the repository <https://github.com/DeepScale/SqueezeNet>.
 
-  The model input is a blob that consists of a single image of 1x3x227x227 in
-  BGR order. The BGR mean values need to be subtracted as follows: [104, 117,
-  123] before passing the image blob into the network.
+  The model input is a blob that consists of a single image of 1x3x227x227 in BGR
+  order. The BGR mean values need to be subtracted as follows: [104, 117, 123] before
+  passing the image blob into the network.
 
-  The model output for `squeezenet1.0` is the typical object classifier output
-  for the 1000 different classifications matching those in the ImageNet database.
+  The model output for "squeezenet1.0" is the typical object classifier output for
+  the 1000 different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: squeezenet1.0.prototxt
diff --git a/models/public/squeezenet1.0/squeezenet1.0.md b/models/public/squeezenet1.0/squeezenet1.0.md
index 04a8de9c222..eaf5c52dff5 100644
--- a/models/public/squeezenet1.0/squeezenet1.0.md
+++ b/models/public/squeezenet1.0/squeezenet1.0.md
@@ -66,4 +66,28 @@ Object classifier according to ImageNet classes, name - `prob`, shape - `1,1000`
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/DeepScale/SqueezeNet/master/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/DeepScale/SqueezeNet/master/LICENSE):
+
+```
+BSD LICENSE.
+
+Redistribution and use in source and binary forms, with or without modification, are permitted
+provided that the following conditions are met:
+
+1. Redistributions of source code must retain the above copyright notice, this list of conditions
+and the following disclaimer.
+
+2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions
+and the following disclaimer in the documentation and/or other materials provided with the
+distribution.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR
+IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
+FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR
+CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
+IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF
+THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/squeezenet1.1-caffe2/model.yml b/models/public/squeezenet1.1-caffe2/model.yml
new file mode 100644
index 00000000000..c6d94355d1f
--- /dev/null
+++ b/models/public/squeezenet1.1-caffe2/model.yml
@@ -0,0 +1,42 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  This is a Caffe2* version of the "squeezenet1.1" model, designed to perform image classification.
+  This model was converted from Caffe* to Caffe2* format. For details, see the repository
+  <https://github.com/caffe2/models/tree/master/squeezenet> and the paper <https://arxiv.org/pdf/1602.07360>.
+task_type: classification
+files:
+  - name: predict_net.pb
+    size: 6175
+    sha256: d20be00eb448d3952265620357132916aba8744b027937b56c469b001b46472b
+    source: https://s3.amazonaws.com/download.caffe2.ai/models/squeezenet/predict_net.pb
+  - name: init_net.pb
+    size: 6181001
+    sha256: d8115221de899d081a1a83785bf0dbaeea19463cdf7dbddba662cc7abb4f32dc
+    source: https://s3.amazonaws.com/download.caffe2.ai/models/squeezenet/init_net.pb
+framework: caffe2
+conversion_to_onnx_args:
+  - --model-path=$dl_dir/predict_net.pb
+  - --model-name=squeezenet1.1-caffe2
+  - --weights=$dl_dir/init_net.pb
+  - --input-shape=1,3,227,227
+  - --input-names=data
+  - --output-file=$conv_dir/squeezenet1.1-caffe2.onnx
+model_optimizer_args:
+  - --input_shape=[1,3,227,227]
+  - --input=data
+  - --mean_values=data[103.96,116.78,123.68]
+  - --input_model=$conv_dir/squeezenet1.1-caffe2.onnx
+license: https://raw.githubusercontent.com/caffe2/models/master/LICENSE
\ No newline at end of file
diff --git a/models/public/squeezenet1.1-caffe2/squeezenet1.1-caffe2.md b/models/public/squeezenet1.1-caffe2/squeezenet1.1-caffe2.md
new file mode 100644
index 00000000000..b1abf5f8cee
--- /dev/null
+++ b/models/public/squeezenet1.1-caffe2/squeezenet1.1-caffe2.md
@@ -0,0 +1,70 @@
+# squeezenet1.1-caffe2
+
+## Use Case and High-Level Description
+
+This is a Caffe2\* version of the `squeezenet1.1` model, designed to perform image classification.
+This model was converted from Caffe\* to Caffe2\* format. 
+For details see repository <https://github.com/caffe2/models/tree/master/squeezenet>,
+paper <https://arxiv.org/pdf/1602.07360>.
+
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 0.784         |
+| MParams           | 1.235         |
+| Source framework  | Caffe2\*      |
+
+## Accuracy
+
+## Performance
+
+## Input
+
+### Original model
+
+Image, name - `data`, shape - `1,3,227,227`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+Mean values - [103.96,116.78,123.68].
+
+### Converted model
+
+Image, name - `data`, shape - `1,3,227,227`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+
+## Output
+
+### Original model
+
+Object classifier according to ImageNet classes, name - `softmaxout`, shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+### Converted model
+
+Object classifier according to ImageNet classes, name - `softmaxout`, shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in the [0, 1] range
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/caffe2/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0.txt](../licenses/APACHE-2.0.txt).
diff --git a/models/public/squeezenet1.1/model.yml b/models/public/squeezenet1.1/model.yml
index 4293ff4cbdb..bf84c573997 100644
--- a/models/public/squeezenet1.1/model.yml
+++ b/models/public/squeezenet1.1/model.yml
@@ -13,19 +13,18 @@
 # limitations under the License.
 
 description: >-
-  The `squeezenet1.1` updated version of the SqueezeNet <https://arxiv.org/pdf/1602.07360>
-  topology. It is designed to perform image classification.  It requires 2.4x
-  less computation than SqueezeNet v1.0 <../squeezenet1.0/squeezenet1.0.md> without
-  diminishing accuracy. The SqueezeNet models have been pre-trained on the ImageNet
-  image database. For details about this family of models, check out the repository
-  <https://github.com/DeepScale/SqueezeNet>.
+  The "squeezenet1.1" model is an updated version of the SqueezeNet <https://arxiv.org/pdf/1602.07360>
+  topology. It is designed to perform image classification.  It requires 2.4x less
+  computation than SqueezeNet v1.0 <../squeezenet1.0/squeezenet1.0.md> without diminishing
+  accuracy. The SqueezeNet models have been pre-trained on the ImageNet image database.
+  For details about this family of models, check out the repository <https://github.com/DeepScale/SqueezeNet>.
 
-  The model input is a blob that consists of a single image of 1x3x227x227 in
-  BGR order. The BGR mean values need to be subtracted as follows: [104, 117,
-  123] before passing the image blob into the network.
+  The model input is a blob that consists of a single image of 1x3x227x227 in BGR
+  order. The BGR mean values need to be subtracted as follows: [104, 117, 123] before
+  passing the image blob into the network.
 
-  The model output for `squeezenet1.1` is the typical object classifier output
-  for the 1000 different classifications matching those in the ImageNet database.
+  The model output for "squeezenet1.1" is the typical object classifier output for
+  the 1000 different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: squeezenet1.1.prototxt
diff --git a/models/public/squeezenet1.1/squeezenet1.1.md b/models/public/squeezenet1.1/squeezenet1.1.md
index f90338eb1c5..eada8e5c6b0 100644
--- a/models/public/squeezenet1.1/squeezenet1.1.md
+++ b/models/public/squeezenet1.1/squeezenet1.1.md
@@ -66,4 +66,28 @@ Object classifier according to ImageNet classes, name - `prob`, shape - `1,1000`
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/DeepScale/SqueezeNet/master/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/DeepScale/SqueezeNet/master/LICENSE):
+
+```
+BSD LICENSE.
+
+Redistribution and use in source and binary forms, with or without modification, are permitted
+provided that the following conditions are met:
+
+1. Redistributions of source code must retain the above copyright notice, this list of conditions
+and the following disclaimer.
+
+2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions
+and the following disclaimer in the documentation and/or other materials provided with the
+distribution.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR
+IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
+FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR
+CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
+IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF
+THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+```
diff --git a/models/public/ssd300/model.yml b/models/public/ssd300/model.yml
index aaabdd3de2b..00e1022f261 100644
--- a/models/public/ssd300/model.yml
+++ b/models/public/ssd300/model.yml
@@ -14,16 +14,15 @@
 
 description: >-
   The "ssd300" model is a Single-Shot multibox Detection <SSD> <https://arxiv.org/pdf/1512.02325.pdf>
-  network intended to perform face detection. This model is implemented using
-  the Caffe\* framework. For details about this model, check out the repository
-  <https://github.com/weiliu89/caffe/tree/ssd>.
+  network intended to perform face detection. This model is implemented using the
+  Caffe* framework. For details about this model, check out the repository <https://github.com/weiliu89/caffe/tree/ssd>.
 
-  The model input is a blob that consists of a single image of 1x3x300x300 in
-  BGR order.  The BGR mean values need to be subtracted as follows: [104.0,117.0,123.0]
+  The model input is a blob that consists of a single image of 1x3x300x300 in BGR
+  order.  The BGR mean values need to be subtracted as follows: [104.0,117.0,123.0]
   before passing the image blob into the network.
 
-  The model output is a typical vector containing the tracked object data, as
-  previously described.
+  The model output is a typical vector containing the tracked object data, as previously
+  described.
 task_type: detection
 files:
   - name: ssd300.tar.gz
diff --git a/models/public/ssd300/ssd300.md b/models/public/ssd300/ssd300.md
index a0c7d6c9cff..562e3546f14 100644
--- a/models/public/ssd300/ssd300.md
+++ b/models/public/ssd300/ssd300.md
@@ -78,4 +78,58 @@ The array of detection summary info, name - `detection_out`,  shape - `1, 1, N,
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/weiliu89/caffe/ssd/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/weiliu89/caffe/ssd/LICENSE):
+
+```
+COPYRIGHT
+
+All new contributions compared to the original branch:
+Copyright (c) 2015, 2016 Wei Liu (UNC Chapel Hill), Dragomir Anguelov (Zoox),
+Dumitru Erhan (Google), Christian Szegedy (Google), Scott Reed (UMich Ann Arbor),
+Cheng-Yang Fu (UNC Chapel Hill), Alexander C. Berg (UNC Chapel Hill).
+All rights reserved.
+
+All contributions by the University of California:
+Copyright (c) 2014, 2015, The Regents of the University of California (Regents)
+All rights reserved.
+
+All other contributions:
+Copyright (c) 2014, 2015, the respective contributors
+All rights reserved.
+
+Caffe uses a shared copyright model: each contributor holds copyright over
+their contributions to Caffe. The project versioning records all such
+contribution and copyright details. If a contributor wants to further mark
+their specific copyright on a particular contribution, they should indicate
+their copyright solely in the commit message of the change when it is
+committed.
+
+LICENSE
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+
+1. Redistributions of source code must retain the above copyright notice, this
+   list of conditions and the following disclaimer.
+2. Redistributions in binary form must reproduce the above copyright notice,
+   this list of conditions and the following disclaimer in the documentation
+   and/or other materials provided with the distribution.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
+ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
+WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
+ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
+(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
+LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
+ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+CONTRIBUTION AGREEMENT
+
+By contributing to the BVLC/caffe repository through pull-request, comment,
+or otherwise, the contributor releases their content to the
+license and copyright terms herein.
+```
diff --git a/models/public/ssd512/model.yml b/models/public/ssd512/model.yml
index 875a27839c6..01b17e5f8d0 100644
--- a/models/public/ssd512/model.yml
+++ b/models/public/ssd512/model.yml
@@ -13,17 +13,16 @@
 # limitations under the License.
 
 description: >-
-  The `ssd512` model is a Single-Shot multibox Detection <SSD> <https://arxiv.org/pdf/1512.02325.pdf>
-  network intended to perform face detection. This model is implemented using
-  the Caffe\*framework. For details about this model, check out the repository
-  <https://github.com/weiliu89/caffe/tree/ssd>.
+  The "ssd512" model is a Single-Shot multibox Detection <SSD> <https://arxiv.org/pdf/1512.02325.pdf>
+  network intended to perform face detection. This model is implemented using the
+  Caffe* framework. For details about this model, check out the repository <https://github.com/weiliu89/caffe/tree/ssd>.
 
-  The model input is a blob that consists of a single image of 1x3x512x512 in
-  BGR order. The BGR mean values need to be subtracted as follows: [104.0,117.0,123.0]
+  The model input is a blob that consists of a single image of 1x3x512x512 in BGR
+  order. The BGR mean values need to be subtracted as follows: [104.0,117.0,123.0]
   before passing the image blob into the network.
 
-  The model output is a typical vector containing the tracked object data, as
-  previously described.
+  The model output is a typical vector containing the tracked object data, as previously
+  described.
 task_type: detection
 files:
   - name: ssd512.tar.gz
diff --git a/models/public/ssd512/ssd512.md b/models/public/ssd512/ssd512.md
index 20307138184..b5ec2c34752 100644
--- a/models/public/ssd512/ssd512.md
+++ b/models/public/ssd512/ssd512.md
@@ -78,4 +78,58 @@ The array of detection summary info, name - `detection_out`,  shape - `1, 1, N,
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/weiliu89/caffe/ssd/LICENSE]()
+The original model is distributed under the following
+[license](https://raw.githubusercontent.com/weiliu89/caffe/ssd/LICENSE):
+
+```
+COPYRIGHT
+
+All new contributions compared to the original branch:
+Copyright (c) 2015, 2016 Wei Liu (UNC Chapel Hill), Dragomir Anguelov (Zoox),
+Dumitru Erhan (Google), Christian Szegedy (Google), Scott Reed (UMich Ann Arbor),
+Cheng-Yang Fu (UNC Chapel Hill), Alexander C. Berg (UNC Chapel Hill).
+All rights reserved.
+
+All contributions by the University of California:
+Copyright (c) 2014, 2015, The Regents of the University of California (Regents)
+All rights reserved.
+
+All other contributions:
+Copyright (c) 2014, 2015, the respective contributors
+All rights reserved.
+
+Caffe uses a shared copyright model: each contributor holds copyright over
+their contributions to Caffe. The project versioning records all such
+contribution and copyright details. If a contributor wants to further mark
+their specific copyright on a particular contribution, they should indicate
+their copyright solely in the commit message of the change when it is
+committed.
+
+LICENSE
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+
+1. Redistributions of source code must retain the above copyright notice, this
+   list of conditions and the following disclaimer.
+2. Redistributions in binary form must reproduce the above copyright notice,
+   this list of conditions and the following disclaimer in the documentation
+   and/or other materials provided with the distribution.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
+ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
+WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
+ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
+(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
+LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
+ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+CONTRIBUTION AGREEMENT
+
+By contributing to the BVLC/caffe repository through pull-request, comment,
+or otherwise, the contributor releases their content to the
+license and copyright terms herein.
+```
diff --git a/models/public/ssd_mobilenet_v1_coco/model.yml b/models/public/ssd_mobilenet_v1_coco/model.yml
index 67053b84909..0ac357d3737 100644
--- a/models/public/ssd_mobilenet_v1_coco/model.yml
+++ b/models/public/ssd_mobilenet_v1_coco/model.yml
@@ -13,11 +13,10 @@
 # limitations under the License.
 
 description: >-
-  The `ssd_mobilenet_v1_coco` model is a Single-Shot multibox Detection <SSD>
-  <https://arxiv.org/pdf/1801.04381.pdf> network intended to perform object detection.
-  The difference bewteen this model and the `mobilenet-ssd` is that there the
-  `mobilenet-ssd` can only detect face, the `ssd_mobilenet_v1_coco` model can
-  detect objects.
+  The "ssd_mobilenet_v1_coco" model is a Single-Shot multibox Detection <SSD> <https://arxiv.org/pdf/1801.04381.pdf>
+  network intended to perform object detection. The difference between this model
+  and the "mobilenet-ssd" is that the "mobilenet-ssd" can only detect faces, while
+  the "ssd_mobilenet_v1_coco" model can detect objects.
 task_type: detection
 files:
   - name: ssd_mobilenet_v1_coco.tar.gz
@@ -33,7 +32,7 @@ model_optimizer_args:
   - --input_shape=[1,300,300,3]
   - --input=image_tensor
   - --output=detection_scores,detection_boxes,num_detections
-  - --tensorflow_use_custom_operations_config=$mo_dir/extensions/front/tf/ssd_v2_support.json
+  - --transformations_config=$mo_dir/extensions/front/tf/ssd_v2_support.json
   - --tensorflow_object_detection_api_pipeline_config=$dl_dir/ssd_mobilenet_v1_coco_2018_01_28/pipeline.config
   - --input_model=$dl_dir/ssd_mobilenet_v1_coco_2018_01_28/frozen_inference_graph.pb
 framework: tf
diff --git a/models/public/ssd_mobilenet_v1_coco/ssd_mobilenet_v1_coco.md b/models/public/ssd_mobilenet_v1_coco/ssd_mobilenet_v1_coco.md
index 85e7be1d32f..75c20449029 100644
--- a/models/public/ssd_mobilenet_v1_coco/ssd_mobilenet_v1_coco.md
+++ b/models/public/ssd_mobilenet_v1_coco/ssd_mobilenet_v1_coco.md
@@ -69,4 +69,6 @@ bounding boxes. For each detection, the description has the format:
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
\ No newline at end of file
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/ssd_mobilenet_v1_fpn_coco/model.yml b/models/public/ssd_mobilenet_v1_fpn_coco/model.yml
index 0695b41c58c..4900a13b96e 100644
--- a/models/public/ssd_mobilenet_v1_fpn_coco/model.yml
+++ b/models/public/ssd_mobilenet_v1_fpn_coco/model.yml
@@ -13,8 +13,7 @@
 # limitations under the License.
 
 description: >-
-  MobileNetV1 FPN. Used for object detection. For details see paper
-  <https://arxiv.org/pdf/1807.03284.pdf>.
+  MobileNetV1 FPN is used for object detection. For details, see the paper <https://arxiv.org/pdf/1807.03284.pdf>.
 task_type: detection
 files:
   - name: ssd_mobilenet_v1_fpn_shared_box_predictor_640x640_coco14_sync_2018_07_03.tar.gz
@@ -30,7 +29,7 @@ model_optimizer_args:
   - --input_shape=[1,640,640,3]
   - --input=image_tensor
   - --output=detection_scores,detection_boxes,num_detections
-  - --tensorflow_use_custom_operations_config=$mo_dir/extensions/front/tf/ssd_v2_support.json
+  - --transformations_config=$mo_dir/extensions/front/tf/ssd_v2_support.json
   - --tensorflow_object_detection_api_pipeline_config=$dl_dir/ssd_mobilenet_v1_fpn_shared_box_predictor_640x640_coco14_sync_2018_07_03/pipeline.config
   - --input_model=$dl_dir/ssd_mobilenet_v1_fpn_shared_box_predictor_640x640_coco14_sync_2018_07_03/frozen_inference_graph.pb
 framework: tf
diff --git a/models/public/ssd_mobilenet_v1_fpn_coco/ssd_mobilenet_v1_fpn_coco.md b/models/public/ssd_mobilenet_v1_fpn_coco/ssd_mobilenet_v1_fpn_coco.md
index f4c77170c7a..8b7bbfd567c 100644
--- a/models/public/ssd_mobilenet_v1_fpn_coco/ssd_mobilenet_v1_fpn_coco.md
+++ b/models/public/ssd_mobilenet_v1_fpn_coco/ssd_mobilenet_v1_fpn_coco.md
@@ -71,4 +71,6 @@ where:
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
\ No newline at end of file
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/ssd_mobilenet_v2_coco/model.yml b/models/public/ssd_mobilenet_v2_coco/model.yml
index c0ea1039f7c..878a776c611 100644
--- a/models/public/ssd_mobilenet_v2_coco/model.yml
+++ b/models/public/ssd_mobilenet_v2_coco/model.yml
@@ -13,19 +13,16 @@
 # limitations under the License.
 
 description: >-
-  The `ssd_mobilenet_v2_coco` model is a Single-Shot multibox Detection <SSD>
-  <https://arxiv.org/pdf/1801.04381.pdf> network intended to perform object detection.
-  The difference between this model and the `mobilenet-ssd` is that the while
-  `mobilenet-ssd` detects faces only, the `ssd_mobilenet_v2_coco` model detects
-  objects, as it has been trained from the Common Objects in Context (COCO) image
-  dataset.
+  The "ssd_mobilenet_v2_coco" model is a Single-Shot multibox Detection <SSD> <https://arxiv.org/pdf/1801.04381.pdf>
+  network intended to perform object detection. The model has been trained on the
+  Common Objects in Context (COCO) image dataset.
 
-  The model input is a blob that consists of a single image of 1x3x300x300 in
-  RGB order.
+  The model input is a blob that consists of a single image of 1x3x300x300 in RGB
+  order.
 
-  The model output is a typical vector containing the tracked object data, as
-  previously described. Note that the "class_id" data is now significant and should
-  be used to determine the classification for any detected object.
+  The model output is a typical vector containing the tracked object data, as previously
+  described. Note that the "class_id" data is now significant and should be used to
+  determine the classification for any detected object.
 task_type: detection
 files:
   - name: ssd_mobilenet_v2_coco.tar.gz
@@ -40,7 +37,7 @@ model_optimizer_args:
   - --reverse_input_channels
   - --input_shape=[1,300,300,3]
   - --input=image_tensor
-  - --tensorflow_use_custom_operations_config=$mo_dir/extensions/front/tf/ssd_v2_support.json
+  - --transformations_config=$mo_dir/extensions/front/tf/ssd_v2_support.json
   - --tensorflow_object_detection_api_pipeline_config=$dl_dir/ssd_mobilenet_v2_coco_2018_03_29/pipeline.config
   - --output=detection_classes,detection_scores,detection_boxes,num_detections
   - --input_model=$dl_dir/ssd_mobilenet_v2_coco_2018_03_29/frozen_inference_graph.pb
diff --git a/models/public/ssd_mobilenet_v2_coco/ssd_mobilenet_v2_coco.md b/models/public/ssd_mobilenet_v2_coco/ssd_mobilenet_v2_coco.md
index ac2f802a4c6..924b6c67a1c 100644
--- a/models/public/ssd_mobilenet_v2_coco/ssd_mobilenet_v2_coco.md
+++ b/models/public/ssd_mobilenet_v2_coco/ssd_mobilenet_v2_coco.md
@@ -2,7 +2,7 @@
 
 ## Use Case and High-Level Description
 
-The `ssd_mobilenet_v2_coco` model is a [Single-Shot multibox Detection (SSD)](https://arxiv.org/pdf/1801.04381.pdf) network intended to perform object detection. The difference between this model and the `mobilenet-ssd` is that the while `mobilenet-ssd` detects faces only, the `ssd_mobilenet_v2_coco` model detects objects, as it has been trained from the Common Objects in Context (COCO) image dataset.
+The `ssd_mobilenet_v2_coco` model is a [Single-Shot multibox Detection (SSD)](https://arxiv.org/pdf/1801.04381.pdf) network intended to perform object detection. The model has been trained on the Common Objects in Context (COCO) image dataset.
 
 The model input is a blob that consists of a single image of 1x3x300x300 in RGB order.
 
@@ -74,4 +74,6 @@ The array of summary detection information, name - `detection_out`,  shape - `1,
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/ssdlite_mobilenet_v2/model.yml b/models/public/ssdlite_mobilenet_v2/model.yml
index e2735747e6e..cbfebcd4d0d 100644
--- a/models/public/ssdlite_mobilenet_v2/model.yml
+++ b/models/public/ssdlite_mobilenet_v2/model.yml
@@ -13,8 +13,9 @@
 # limitations under the License.
 
 description: >-
-  MobileNetV2: Inverted Residuals and Linear Bottlenecks. Used for object detection.
-  For details see paper <https://arxiv.org/pdf/1801.04381.pdf>.
+  The "ssdlite_mobilenet_v2" model is used for object detection. For details, see
+  the paper <https://arxiv.org/pdf/1801.04381.pdf>, MobileNetV2: Inverted Residuals
+  and Linear Bottlenecks.
 task_type: detection
 files:
   - name: ssdlite_mobilenet_v2_coco_2018_05_09.tar.gz
@@ -30,7 +31,7 @@ model_optimizer_args:
   - --input_shape=[1,300,300,3]
   - --input=image_tensor
   - --output=detection_scores,detection_boxes,num_detections
-  - --tensorflow_use_custom_operations_config=$mo_dir/extensions/front/tf/ssd_v2_support.json
+  - --transformations_config=$mo_dir/extensions/front/tf/ssd_v2_support.json
   - --tensorflow_object_detection_api_pipeline_config=$dl_dir/ssdlite_mobilenet_v2_coco_2018_05_09/pipeline.config
   - --input_model=$dl_dir/ssdlite_mobilenet_v2_coco_2018_05_09/frozen_inference_graph.pb
 framework: tf
diff --git a/models/public/ssdlite_mobilenet_v2/ssdlite_mobilenet_v2.md b/models/public/ssdlite_mobilenet_v2/ssdlite_mobilenet_v2.md
index e1fd006558b..d929317552d 100644
--- a/models/public/ssdlite_mobilenet_v2/ssdlite_mobilenet_v2.md
+++ b/models/public/ssdlite_mobilenet_v2/ssdlite_mobilenet_v2.md
@@ -69,4 +69,6 @@ bounding boxes. For each detection, the description has the format:
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/tensorflow/models/master/LICENSE]()
\ No newline at end of file
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/tensorflow/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0-TensorFlow.txt](../licenses/APACHE-2.0-TensorFlow.txt).
diff --git a/models/public/vehicle-license-plate-detection-barrier-0123/description/vehicle-license-plate-detection-barrier-0123.jpg b/models/public/vehicle-license-plate-detection-barrier-0123/description/vehicle-license-plate-detection-barrier-0123.jpg
new file mode 100644
index 00000000000..df80e616cd7
Binary files /dev/null and b/models/public/vehicle-license-plate-detection-barrier-0123/description/vehicle-license-plate-detection-barrier-0123.jpg differ
diff --git a/models/public/vehicle-license-plate-detection-barrier-0123/description/vehicle-license-plate-detection-barrier-0123.md b/models/public/vehicle-license-plate-detection-barrier-0123/description/vehicle-license-plate-detection-barrier-0123.md
new file mode 100644
index 00000000000..359cae78841
--- /dev/null
+++ b/models/public/vehicle-license-plate-detection-barrier-0123/description/vehicle-license-plate-detection-barrier-0123.md
@@ -0,0 +1,86 @@
+# vehicle-license-plate-detection-barrier-0123
+
+## Use Case and High-level Description
+
+This is a MobileNetV2 + SSD-based vehicle and (Chinese) license plate detector for
+the "Barrier" use case.
+
+## Example
+![](./vehicle-license-plate-detection-barrier-0123.jpg)
+
+## Specification
+
+| Metric                          | Value                                      |
+|---------------------------------|--------------------------------------------|
+| Mean Average Precision (mAP)    | 99.52%                                     |
+| AP vehicles                     | 99.90%                                     |
+| AP plates                       | 99.13%                                     |
+| Car pose                        | Front facing cars                          |
+| Min plate width                 | 96 pixels                                  |
+| Max objects to detect           | 200                                        |
+| GFlops                          | 8.666                                      |
+| MParams                         | 0.547                                      |
+| Source framework                | TensorFlow*                                |
+
+Average Precision (AP) is defined as an area under the
+[precision/recall](https://en.wikipedia.org/wiki/Precision_and_recall)
+curve. Validation dataset is BIT-Vehicle.
+
+## Performance
+
+## Input
+
+### Original Model
+
+An input image, name: `input`, shape: [1x256x256x3], format: [BxHxWxC],
+   where:
+
+    - B - batch size
+    - H - image height
+    - W - image width
+    - C - number of channels
+
+   Expected color order: RGB.
+   Mean values: [127.5,127.5,127.5], scale factor for each channel: 127.5
+
+### Converted Model
+
+An input image, name: `input`, shape: [1x3x256x256], format: [BxCxHxW],
+   where:
+    - B - batch size
+    - C - number of channels
+    - H - image height
+    - W - image width
+
+   Expected color order is BGR.
+
+## Output
+
+### Original Model
+
+The net outputs a blob with the shape: [1, 1, N, 7], where N is the number of detected
+   bounding boxes. For each detection, the description has the format:
+   [`image_id`, `label`, `conf`, `x_min`, `y_min`, `x_max`, `y_max`]
+    - `image_id` - ID of the image in the batch
+    - `label` - predicted class ID
+    - `conf` - confidence for the predicted class
+    - (`x_min`, `y_min`) - coordinates of the top left bounding box corner
+    - (`x_max`, `y_max`) - coordinates of the bottom right bounding box corner.
+
+### Converted Model
+
+The net outputs a blob with the shape: [1, 1, N, 7], where N is the number of detected
+   bounding boxes. For each detection, the description has the format:
+   [`image_id`, `label`, `conf`, `x_min`, `y_min`, `x_max`, `y_max`]
+    - `image_id` - ID of the image in the batch
+    - `label` - predicted class ID
+    - `conf` - confidence for the predicted class
+    - (`x_min`, `y_min`) - coordinates of the top left bounding box corner
+    - (`x_max`, `y_max`) - coordinates of the bottom right bounding box corner.
+
+## Legal Information
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/opencv/openvino_training_extensions/develop/LICENSE).
+A copy of the license is provided in [APACHE-2.0.txt](../../licenses/APACHE-2.0.txt).
+
+[*] Other names and brands may be claimed as the property of others.
diff --git a/models/public/vehicle-license-plate-detection-barrier-0123/model.yml b/models/public/vehicle-license-plate-detection-barrier-0123/model.yml
new file mode 100644
index 00000000000..6675ed02793
--- /dev/null
+++ b/models/public/vehicle-license-plate-detection-barrier-0123/model.yml
@@ -0,0 +1,37 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  This is a MobileNetV2 + SSD-based vehicle and (Chinese) license plate detector for
+  the "Barrier" use case.
+task_type: detection
+files:
+  - name: ssd-mobilenet-v2-0.35.1-barrier-256x256-0123.tar.gz
+    size: 4387714
+    sha256: de6744bc72339f29109f595bc51b47383595ffb06ed15a7438f2ae9cb8a2a77c
+    source: https://download.01.org/opencv/openvino_training_extensions/models/ssd_detector/ssd-mobilenet-v2-0.35.1-barrier-256x256-0123.tar.gz
+postprocessing:
+  - $type: unpack_archive
+    format: gztar
+    file: ssd-mobilenet-v2-0.35.1-barrier-256x256-0123.tar.gz
+model_optimizer_args:
+  - --reverse_input_channels
+  - --input_shape=[1,256,256,3]
+  - --scale=127.5
+  - --mean_values=[127.5,127.5,127.5]
+  - --transformations_config=$dl_dir/model/model.tfmo.json
+  - --output=ssd_heads/concat_reshape_softmax/mbox_loc_final,ssd_heads/concat_reshape_softmax/mbox_conf_final,ssd_heads/concat_reshape_softmax/mbox_priorbox
+  - --input_model=$dl_dir/model/model.pb.frozen
+framework: tf
+license: https://raw.githubusercontent.com/opencv/training_toolbox_tensorflow/develop/LICENSE
diff --git a/models/public/vgg16/model.yml b/models/public/vgg16/model.yml
index 23d8145ca55..26510b6b31f 100644
--- a/models/public/vgg16/model.yml
+++ b/models/public/vgg16/model.yml
@@ -13,15 +13,15 @@
 # limitations under the License.
 
 description: >-
-  The `vgg16` model is one of the vgg <https://arxiv.org/pdf/1409.1556.pdf> models
-  designed to perform image classification in Caffe\*format.
+  The "vgg16" model is one of the vgg <https://arxiv.org/pdf/1409.1556.pdf> models
+  designed to perform image classification in Caffe* format.
 
-  The model input is a blob that consists of a single image of "1x3x224x224" in
-  BGR order. The BGR mean values need to be subtracted as follows: [103.939, 116.779,
+  The model input is a blob that consists of a single image of "1x3x224x224" in BGR
+  order. The BGR mean values need to be subtracted as follows: [103.939, 116.779,
   123.68] before passing the image blob into the network.
 
-  The model output for `vgg16` is the typical object classifier output for the
-  1000 different classifications matching those in the ImageNet database.
+  The model output for "vgg16" is the typical object classifier output for the 1000
+  different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: vgg16.prototxt
diff --git a/models/public/vgg16/vgg16.md b/models/public/vgg16/vgg16.md
index e03983ce893..b64aaea0639 100644
--- a/models/public/vgg16/vgg16.md
+++ b/models/public/vgg16/vgg16.md
@@ -66,4 +66,6 @@ Object classifier according to ImageNet classes, name - `prob`, shape - `1,1000`
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/keras-team/keras/master/LICENSE]()
+The original model is distributed under the
+[Creative Commons Attribution 4.0 International Public License](https://creativecommons.org/licenses/by/4.0/legalcode.txt).
+A copy of the license is provided in [CC-BY-4.0.txt](../licenses/CC-BY-4.0.txt).
diff --git a/models/public/vgg19-caffe2/model.yml b/models/public/vgg19-caffe2/model.yml
new file mode 100644
index 00000000000..76d308345b0
--- /dev/null
+++ b/models/public/vgg19-caffe2/model.yml
@@ -0,0 +1,42 @@
+# Copyright (c) 2019 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+description: >-
+  This is a Caffe2* version of "vgg19" model, designed to perform image classification.
+  This model was converted from Caffe* to Caffe2* format.  For details see repository
+  <https://github.com/caffe2/models/tree/master/vgg19>, paper <https://arxiv.org/pdf/1409.1556.pdf>.
+task_type: classification
+files:
+  - name: predict_net.pb
+    size: 2862
+    sha256: ebb8608fe80ee8bce096a60ecf3e6e8442eb118aaa0fa77d5d58b5dcff7dfb5f
+    source: https://s3.amazonaws.com/download.caffe2.ai/models/vgg19/predict_net.pb
+  - name: init_net.pb
+    size: 718338501
+    sha256: 492dbbbc7dd23cb052c66964714759f88370f3fa8542aa32556e93abc7beb69f
+    source: https://s3.amazonaws.com/download.caffe2.ai/models/vgg19/init_net.pb
+framework: caffe2
+conversion_to_onnx_args:
+  - --model-path=$dl_dir/predict_net.pb
+  - --model-name=vgg19-caffe2
+  - --weights=$dl_dir/init_net.pb
+  - --input-shape=1,3,224,224
+  - --input-names=data
+  - --output-file=$conv_dir/vgg19-caffe2.onnx
+model_optimizer_args:
+  - --input_shape=[1,3,224,224]
+  - --input=data
+  - --mean_values=data[103.939,116.779,123.68]
+  - --input_model=$conv_dir/vgg19-caffe2.onnx
+license: https://raw.githubusercontent.com/caffe2/models/master/LICENSE
\ No newline at end of file
diff --git a/models/public/vgg19-caffe2/vgg19-caffe2.md b/models/public/vgg19-caffe2/vgg19-caffe2.md
new file mode 100644
index 00000000000..c7bcd6393d8
--- /dev/null
+++ b/models/public/vgg19-caffe2/vgg19-caffe2.md
@@ -0,0 +1,69 @@
+# vgg19-caffe2
+
+## Use Case and High-Level Description
+
+This is a Caffe2\* version of `vgg19` model, designed to perform image classification.
+This model was converted from Caffe\* to Caffe2\* format. 
+For details see repository <https://github.com/caffe2/models/tree/master/vgg19>,
+paper <https://arxiv.org/pdf/1409.1556.pdf>.
+## Example
+
+## Specification
+
+| Metric            | Value         |
+|-------------------|---------------|
+| Type              | Classification|
+| GFLOPs            | 39.3          |
+| MParams           | 143.667       |
+| Source framework  | Caffe2\*      |
+
+## Accuracy
+
+## Performance
+
+## Input
+
+### Original model
+
+Image, name - `data`,  shape - `1,3,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+Mean values - [103.939, 116.779, 123.68].
+
+### Converted model
+
+Image, name - `data`, shape - `1,3,224,224`, format is `B,C,H,W` where:
+
+- `B` - batch size
+- `C` - channel
+- `H` - height
+- `W` - width
+
+Channel order is `BGR`.
+
+## Output
+
+### Original model
+
+Object classifier according to ImageNet classes, name - `prob`, shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in  [0, 1] range
+
+### Converted model
+
+Object classifier according to ImageNet classes, name - `prob`, shape - `1,1000`, output data format is `B,C` where:
+
+- `B` - batch size
+- `C` - predicted probabilities for each class in  [0, 1] range
+
+## Legal Information
+
+The original model is distributed under the
+[Apache License, Version 2.0](https://raw.githubusercontent.com/caffe2/models/master/LICENSE).
+A copy of the license is provided in [APACHE-2.0.txt](../licenses/APACHE-2.0.txt).
diff --git a/models/public/vgg19/model.yml b/models/public/vgg19/model.yml
index 5c2bba96055..229ab72c88a 100644
--- a/models/public/vgg19/model.yml
+++ b/models/public/vgg19/model.yml
@@ -13,15 +13,15 @@
 # limitations under the License.
 
 description: >-
-  The `vgg19` model is one of the vgg <https://arxiv.org/pdf/1409.1556.pdf> models
-  designed to perform image classification in Caffe\* format.
+  The "vgg19" model is one of the vgg <https://arxiv.org/pdf/1409.1556.pdf> models
+  designed to perform image classification in Caffe* format.
 
-  The model input is a blob that consists of a single image of 1x3x224x224 in
-  BGR order. The BGR mean values need to be subtracted as follows: [103.939, 116.779,
+  The model input is a blob that consists of a single image of 1x3x224x224 in BGR
+  order. The BGR mean values need to be subtracted as follows: [103.939, 116.779,
   123.68] before passing the image blob into the network.
 
-  The model output for `vgg19` is the typical object classifier output for the
-  1000 different classifications matching those in the ImageNet database.
+  The model output for "vgg19" is the typical object classifier output for the 1000
+  different classifications matching those in the ImageNet database.
 task_type: classification
 files:
   - name: vgg19.prototxt
diff --git a/models/public/vgg19/vgg19.md b/models/public/vgg19/vgg19.md
index ca5ddcebc38..123fab9c456 100644
--- a/models/public/vgg19/vgg19.md
+++ b/models/public/vgg19/vgg19.md
@@ -66,4 +66,6 @@ Object classifier according to ImageNet classes, name - `prob`, shape - `1,1000`
 
 ## Legal Information
 
-[https://raw.githubusercontent.com/keras-team/keras/master/LICENSE]()
+The original model is distributed under the
+[Creative Commons Attribution 4.0 International Public License](https://creativecommons.org/licenses/by/4.0/legalcode.txt).
+A copy of the license is provided in [CC-BY-4.0.txt](../licenses/CC-BY-4.0.txt).
diff --git a/tools/accuracy_checker/.pylintrc b/tools/accuracy_checker/.pylintrc
index 9c6fd442b41..c27ba95f9dd 100644
--- a/tools/accuracy_checker/.pylintrc
+++ b/tools/accuracy_checker/.pylintrc
@@ -21,7 +21,7 @@ disable = C0103,
 max-line-length = 120
 ignore-docstrings = yes
 extension-pkg-whitelist=inference_engine,cv2,numpy,mxnet,tensorflow,pycocotools,onnxruntime
-ignored-modules = numpy,cv2,openvino.inference_engine,caffe,mxnet,tensorflow,pycocotools,onnxruntime
+ignored-modules = numpy,cv2,openvino.inference_engine,caffe,mxnet,tensorflow,pycocotools,onnxruntime,torch
 load-plugins = pylint_checkers
 ignored-classes = pathlib.PurePath
 jobs=0
diff --git a/tools/accuracy_checker/.yamllint b/tools/accuracy_checker/.yamllint
new file mode 100644
index 00000000000..880eebad36b
--- /dev/null
+++ b/tools/accuracy_checker/.yamllint
@@ -0,0 +1,29 @@
+yaml-files:
+  - '*.yaml'
+  - '*.yml'
+  - '.yamllint'
+
+rules:
+  line-length: disable
+  braces: enable
+  brackets: enable
+  colons: disable
+  commas: enable
+  comments:
+    level: warning
+  comments-indentation:
+    level: warning
+  document-end: disable
+  document-start: disable
+  empty-lines: enable
+  empty-values: enable
+  hyphens: enable
+  indentation: enable
+  key-duplicates: enable
+  key-ordering: disable
+  new-line-at-end-of-file: enable
+  new-lines: enable
+  octal-values: disable
+  quoted-strings: disable
+  trailing-spaces: enable
+  truthy: disable
diff --git a/tools/accuracy_checker/README.md b/tools/accuracy_checker/README.md
index d36daf4479c..e212f629633 100644
--- a/tools/accuracy_checker/README.md
+++ b/tools/accuracy_checker/README.md
@@ -45,10 +45,11 @@ In order to evaluate some models required frameworks have to be installed. Accur
 
 - [OpenVINO](https://software.intel.com/en-us/openvino-toolkit/documentation/get-started).
 - [Caffe](accuracy_checker/launcher/caffe_installation_readme.md).
-- [MxNet](https://mxnet.incubator.apache.org/versions/master/).
+- [MXNet](https://mxnet.apache.org/).
 - [OpenCV DNN](https://docs.opencv.org/4.1.0/d2/de6/tutorial_py_setup_in_ubuntu.html).
 - [TensorFlow](https://www.tensorflow.org/).
 - [ONNX Runtime](https://github.com/microsoft/onnxruntime/blob/master/README.md).
+- [PyTorch](https://pytorch.org/)
 
 You can use any of them or several at a time.
 
@@ -60,6 +61,13 @@ If all prerequisite are installed, then you are ready to install **accuracy chec
 python3 setup.py install
 ```
 
+Accuracy Checker is a modular tool and has some task-specific dependencies; all required modules can be found in the `requirements.in` file.
+You can install the tool without dependencies and manage them yourself using the following command instead of the standard installation:
+
+```bash
+pip install . --no-dependencies
+```
+
 #### Usage
 
 You may test your installation and get familiar with accuracy checker by running [sample](sample/README.md).
@@ -87,6 +95,13 @@ You may refer to `-h, --help` to full list of command line options. Some optiona
 - `-tf, --target_framework` framework for infer.
 - `-td, --target_devices` devices for infer. You can specify several devices using space as a delimiter.
 
+You can also replace some command line arguments with environment variables for path prefixing. The following variables are supported:
+* `DATA_DIR` -  equivalent of `-s`, `--source`.
+* `MODELS_DIR` - equivalent of `-m`, `--models`.
+* `EXTENSIONS` - equivalent of `-e`, `--extensions`.
+* `ANNOTATIONS_DIR` - equivalent of `-a`, `--annotations`.
+* `BITSTREAMS_DIR` - equivalent of `-b`, `--bitstreams`.
+
 #### Configuration
 
 There is config file which declares validation process.
@@ -110,6 +125,10 @@ models:
   datasets:
     - name: dataset_name
 ```
+Optionally, you can use a global configuration. It helps avoid duplication if you have several models that should be run on the same dataset.
+An example of a global definitions file can be found [here](dataset_definitions.yml). Global definitions are merged with the evaluation config at runtime by dataset name.
+Parameters of the global configuration can be overridden by the local config (e.g. if the definitions specify resize with destination size 224 and the local config uses resize with size 227, the value from the local config, 227, will be used as the resize parameter).
+You can use the `global_definitions` field to specify the path to global definitions directly in the model config, or pass it via command line arguments (`-d`, `--definitions`).
 
 ### Launchers
 
@@ -120,10 +139,11 @@ Please view:
 - [how to configure Caffe launcher](accuracy_checker/launcher/caffe_launcher_readme.md).
 - [how to configure DLSDK launcher](accuracy_checker/launcher/dlsdk_launcher_readme.md).
 - [how to configure OpenCV launcher](accuracy_checker/launcher/opencv_launcher_readme.md).
-- [how to configure MxNet Launcher](accuracy_checker/launcher/mxnet_launcher_readme.md).
+- [how to configure MXNet Launcher](accuracy_checker/launcher/mxnet_launcher_readme.md).
 - [how to configure TensorFlow Launcher](accuracy_checker/launcher/tf_launcher_readme.md).
 - [how to configure TensorFlow Lite Launcher](accuracy_checker/launcher/tf_lite_launcher_readme.md).
 - [how to configure ONNX Runtime Launcher](accuracy_checker/launcher/onnx_runtime_launcher_readme.md).
+- [how to configure PyTorch Launcher](accuracy_checker/launcher/pytorch_launcher_readme.md)
 
 ### Datasets
 
@@ -216,3 +236,9 @@ Typical workflow for testing new model include:
 1. Choose one of *adapters* or write your own. Adapter converts raw output produced by framework to high level problem specific representation (e.g. *ClassificationPrediction*, *DetectionPrediction*, etc).
 1. Reproduce preprocessing, metrics and postprocessing from canonical paper.
 1. Create entry in config file and execute.
+
+### Customizing Evaluation
+
+The standard Accuracy Checker validation pipeline is: Annotation Reading -> Data Reading -> Preprocessing -> Inference -> Postprocessing -> Metrics.
+In some cases it can be unsuitable (e.g. if you have a sequence of models). You can customize the validation pipeline using your own evaluator.
+More details about custom evaluations can be found in the [related section](custom_evaluators/README.md).
diff --git a/tools/accuracy_checker/accuracy_checker/__init__.py b/tools/accuracy_checker/accuracy_checker/__init__.py
index b6d89a2d811..1ecfbfdc449 100644
--- a/tools/accuracy_checker/accuracy_checker/__init__.py
+++ b/tools/accuracy_checker/accuracy_checker/__init__.py
@@ -14,4 +14,4 @@
 limitations under the License.
 """
 
-__version__ = "0.7.3"
+__version__ = "0.7.5"
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/README.md b/tools/accuracy_checker/accuracy_checker/adapters/README.md
index 224c2040ede..de67d83e644 100644
--- a/tools/accuracy_checker/accuracy_checker/adapters/README.md
+++ b/tools/accuracy_checker/accuracy_checker/adapters/README.md
@@ -20,36 +20,40 @@ AccuracyChecker supports following set of adapters:
 * `classification` - converting output of classification model to `ClassificationPrediction` representation.
 * `segmentation` - converting output of semantic segmentation model to `SeegmentationPrediction` representation.
   * `make_argmax` - allows to apply argmax operation to output values.
+* `segmentation_one_class` - converting output of semantic segmentation to `SegmentationPrediction` representation. It is suitable for the situation when the model's output is the probability of each pixel belonging to the foreground class.
+  * `threshold` - minimum probability threshold for valid class belonging.
 * `tiny_yolo_v1` - converting output of Tiny YOLO v1 model to `DetectionPrediction` representation.
 * `reid` - converting output of reidentification model to `ReIdentificationPrediction` representation.
   * `grn_workaround` - enabling processing output with adding Global Region Normalization layer.
 * `yolo_v2` - converting output of YOLO v2 family models to `DetectionPrediction` representation.
   * `classes` - number of detection classes (default 20).
-  * `anchors` - anchor values provided as comma-separated list or one of precomputed: 
+  * `anchors` - anchor values provided as comma-separated list or one of precomputed:
     - `yolo_v2` - `[1.3221, 1.73145, 3.19275, 4.00944, 5.05587, 8.09892, 9.47112, 4.84053, 11.2364, 10.0071]`,
     - `tiny_yolo_v2` - `[1.08, 1.19, 3.42, 4.41, 6.63, 11.38, 9.42, 5.11, 16.62, 10.52]`
   * `coords` - number of bbox coordinates (default 4).
   * `num` - num parameter from DarkNet configuration file (default 5).
+  * `cells` - number of cells across width and height (default 13).
 * `yolo_v3` - converting output of YOLO v3 family models to `DetectionPrediction` representation.
   * `classes` - number of detection classes (default 80).
-  * `anchors` - anchor values provided as comma-separited list or precomputed: 
+  * `anchors` - anchor values provided as comma-separited list or precomputed:
     - `yolo_v3` - `[10.0, 13.0, 16.0, 30.0, 33.0, 23.0, 30.0, 61.0, 62.0, 45.0, 59.0, 119.0, 116.0, 90.0, 156.0, 198.0, 373.0, 326.0]`
     - `tiny_yolo_v3` - `[10.0, 14.0, 23.0, 27.0, 37.0, 58.0, 81.0, 82.0, 135.0, 169.0, 344.0, 319.0]`
   * `coords` - number of bbox coordinates (default 4).
   * `num` - num parameter from DarkNet configuration file (default 3).
+  * `anchor_mask` - mask of the anchors used for each output layer (Optional; if not provided, the default way of selecting anchors will be used).
   * `threshold` - minimal objectness score value for valid detections (default 0.001).
   * `input_width` and `input_height` - network input width and height correspondingly (default 416).
   * `outputs` - the list of output layers names (optional), if specified there should be exactly 3 output layers provided.
 * `lpr` - converting output of license plate recognition model to `CharacterRecognitionPrediction` representation.
 * `ssd` - converting  output of SSD model to `DetectionPrediction` representation.
-* `ssd_mxnet` - converting output of SSD-based models from MxNet framework to `DetectionPrediction` representation.
-* `pytorch_ssd_decoder` - converts output of SSD model from Pytorch without embedded decoder.
+* `ssd_mxnet` - converting output of SSD-based models from MXNet framework to `DetectionPrediction` representation.
+* `pytorch_ssd_decoder` - converts output of SSD model from PyTorch without embedded decoder.
   * `scores_out` - name of output layer with bounding boxes scores.
   * `boxes_out` - name of output layer with bounding boxes coordinates.
   * `confidence_threshold` - lower bound for valid boxes scores (optional, default 0.05).
   * `nms_threshold` - overlap threshold for NMS (optional, default 0.5).
   * `keep_top_k ` - maximal number of boxes which should be kept (optional, default 200).
-* `ssd_onnx` - converting output of SSD-based model from Pytorch with NonMaxSuppression layer.
+* `ssd_onnx` - converting output of SSD-based model from PyTorch with NonMaxSuppression layer.
   * `labels_out` - name of output layer with labels or regular expression for it searching.
   * `scores_out`- name of output layer with scores or regular expression for it searching.
   * `bboxes_out` - name of output layer with bboxes or regular expression for it searching.
@@ -58,15 +62,18 @@ AccuracyChecker supports following set of adapters:
   * `boxes_out` - name of output layer with predicted boxes coordinates in format [y0, x0, y1, x1].
   *  `scores_out` - name of output layer with detection scores.
   * `num_detections_out` - name of output layer which contains the number of valid detections.
-* `face_person_detection` - converting face person detection model output with 2 detection outputs to `ContainerPredition`, where value of parameters `face_out`and `person_out` are used for identification `DetectionPrediction` in container. 
+* `retinanet` - converting output of RetinaNet-based model.
+  * `loc_out` - name of output layer with bounding box deltas.
+  * `class_out` - name of output layer with classification probabilities.
+* `face_person_detection` - converting face person detection model output with 2 detection outputs to `ContainerPredition`, where value of parameters `face_out`and `person_out` are used for identification `DetectionPrediction` in container.
   * `face_out` -  face detection output layer name.
   * `person_out` - person detection output layer name.
 * `person_attributes` - converting person attributes recognition model output to `MultiLabelRecognitionPrediction`.
   * `attributes_recognition_out` - output layer name with attributes scores. (optional, used if your model has more than one outputs).
-* `vehicle_attributes`  - converting vehicle attributes recognition model output to `ContainerPrediction` where value of parameters `color_out`and `type_out` are used for identification `ClassificationPrediction` in container. 
+* `vehicle_attributes`  - converting vehicle attributes recognition model output to `ContainerPrediction` where value of parameters `color_out`and `type_out` are used for identification `ClassificationPrediction` in container.
   * `color_out` - vehicle color attribute output layer name.
   * `type_out`- vehicle type attribute output layer name.
-* `head_pose` - converting head pose estimation model output to `ContainerPrediction` where names of parameters `angle_pitch`, `angle_yaw` and `angle_roll` are used for identification `RegressionPrediction` in container. 
+* `head_pose` - converting head pose estimation model output to `ContainerPrediction` where names of parameters `angle_pitch`, `angle_yaw` and `angle_roll` are used for identification `RegressionPrediction` in container.
   * `angle_pitch` - output layer name for pitch angle.
   * `angle_yaw`- output layer name for yaw angle.
   * `angle_roll` - output layer name for roll angle.
@@ -85,6 +92,13 @@ AccuracyChecker supports following set of adapters:
   * `action_scale` - scale for correct action score calculation.
 * `super_resolution` - converting output of single image super resolution network to `SuperResolutionPrediction`.
   * `reverse_channels` - allow switching output image channels e.g. RGB to BGR (Optional. Default value is False).
+  * `mean` - value or list of channel-wise values which should be added to the result to get values in range [0, 255] (Optional, default 0).
+  * `std` - value or list of channel-wise values by which the result should be multiplied to get values in range [0, 255] (Optional, default 255).
+  **Important** Usually `mean` and `std` are the same as those used in preprocessing; here they are used to revert these preprocessing operations.
+  The order of actions:
+  1. Multiply by `std`
+  2. Add `mean`
+  3. Reverse channels if this option enabled.
 * `landmarks_regression` - converting output of model for landmarks regression to `FacialLandmarksPrediction`.
 * `pixel_link_text_detection` - converting output of PixelLink like model for text detection to `TextDetectionPrediction`.
   * `pixel_class_out` - name of layer containing information related to text/no-text classification for each pixel.
@@ -113,6 +127,7 @@ AccuracyChecker supports following set of adapters:
 * `human_pose_estimation` - converting output of model for human pose estimation to `PoseEstimationPrediction`.
   * `part_affinity_fields_out` - name of output layer with keypoints pairwise relations (part affinity fields).
   * `keypoints_heatmap_out` - name of output layer with keypoints heatmaps.
+  The output layers can be omitted if the model has only one output layer - the concatenation of these two.
 * `beam_search_decoder` - realization CTC Beam Search decoder for symbol sequence recognition, converting model output to `CharacterRecognitionPrediction`.
   * `beam_size` -  size of the beam to use during decoding (default 10).
   * `blank_label` - index of the CTC blank label.
@@ -120,6 +135,37 @@ AccuracyChecker supports following set of adapters:
 * `gaze_estimation` - converting output of gaze estimation model to `GazeVectorPrediction`.
 * `hit_ratio_adapter` - converting output NCF model to `HitRatioPrediction`.
 * `brain_tumor_segmentation` - converting output of brain tumor segmentation model to `BrainTumorSegmentationPrediction`.
+  * `make_argmax`  - allows to apply argmax operation to output values. (default - `False`)
+  * `label_order` - sets mapping from output classes to dataset classes. For example: `label_order: [3,1,2]` means that class with id 3 from model's output matches with class with id 1 from dataset,  class with id 1 from model's output matches with class with id 2 from dataset, class with id 2 from model's output matches with class with id 3 from dataset.
 * `nmt` - converting output of neural machine translation model to `MachineTranslationPrediction`.
   * `vocabulary_file` - file which contains vocabulary for encoding model predicted indexes to words (e. g. vocab.bpe.32000.de). Path can be prefixed with `--models` arguments.
   * `eos_index` - index end of string symbol in vocabulary (Optional, used in cases when launcher does not support dynamic output shape for cut off empty prediction).
+* `bert_question_answering` - converting output of BERT model trained to solve question answering task to `QuestionAnsweringPrediction`.
+* `bert_classification` - converting output of BERT model trained for classification task to `ClassificationPrediction`.
+  * `num_classes` - number of predicted classes.
+  * `classification_out` - name of output layer with classification probabilities. (Optional, if not provided default first output blob will be used).
+* `human_pose_estimation_3d` - converting output of model for 3D human pose estimation to `PoseEstimation3dPrediction`.
+  * `features_3d_out` - name of output layer with 3D coordinates maps.
+  * `keypoints_heatmap_out` - name of output layer with keypoints heatmaps.
+  * `part_affinity_fields_out` - name of output layer with keypoints pairwise relations (part affinity fields).
+* `ctdet` - converting output of CenterNet object detection model to `DetectionPrediction`.
+  * `center_heatmap_out` - name of output layer with center points heatmaps.
+  * `width_height_out` - name of the output layer with object sizes.
+  * `regression_out` - name of the regression output with the offset prediction.
+* `mask_rcnn` - converting raw outputs of Mask-RCNN to combination of `DetectionPrediction` and `CoCocInstanceSegmentationPrediction`.
+  * `classes_out` - name of output layer with information about classes (optional, if your model has detection_output layer as output).
+  * `scores_out` - name of output layer with bbox scores (optional, if your model has detection_output layer as output).
+  * `boxes_out` - name of output layer with bboxes (optional, if your model has detection_output layer as output).
+  * `raw_masks_out` - name of output layer with raw instances masks.
+  * `num_detections_out` - name of output layer with the number of valid detections (used in MaskRCNN models trained with TF Object Detection API).
+  * `detection_out` - SSD-like detection output layer name (optional, if your model has scores_out, boxes_out and classes_out).
+* `mask_rcnn_with_text` - converting raw outputs of Mask-RCNN with additional Text Recognition head to `TextDetectionPrediction`.
+  * `classes_out` - name of output layer with information about classes.
+  * `scores_out` - name of output layer with bbox scores.
+  * `boxes_out` - name of output layer with bboxes.
+  * `raw_masks_out` - name of output layer with raw instances masks.
+  * `texts_out` - name of output layer with texts.
+  * `confidence_threshold` - confidence threshold that is used to filter out detected instances.
+* `fcos_person` - converting output of FCOS (single class) model to `DetectionPrediction` representation.
+  * `output_blob` - name of output layer with bboxes.
+  * `scale` - scalar value to normalize bbox coordinates.
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/__init__.py b/tools/accuracy_checker/accuracy_checker/adapters/__init__.py
index ac8c4b57ede..23f8b857f15 100644
--- a/tools/accuracy_checker/accuracy_checker/adapters/__init__.py
+++ b/tools/accuracy_checker/accuracy_checker/adapters/__init__.py
@@ -37,19 +37,32 @@
 
 from .reidentification import ReidAdapter
 from .detection import (
-    TinyYOLOv1Adapter, SSDAdapter, FacePersonAdapter, YoloV2Adapter, YoloV3Adapter, TFObjectDetectionAPIAdapter
+    SSDAdapter,
+    FacePersonAdapter,
+    TFObjectDetectionAPIAdapter,
+    SSDAdapterMxNet,
+    PyTorchSSDDecoder,
+    SSDONNXAdapter,
+    MTCNNPAdapter,
+    RetinaNetAdapter,
+    FCOSPersonAdapter
 )
+from .yolo import TinyYOLOv1Adapter, YoloV2Adapter, YoloV3Adapter
 from .classification import ClassificationAdapter
 from .segmentation import SegmentationAdapter, BrainTumorSegmentationAdapter
 from .pose_estimation import HumanPoseAdapter
+from .pose_estimation_3d import HumanPose3dAdapter
 
 from .dummy_adapters import XML2DetectionAdapter
 
 from .hit_ratio import HitRatioAdapter
 
 from .mask_rcnn import MaskRCNNAdapter
+from .mask_rcnn_with_text import MaskRCNNWithTextAdapter
 
-from .nlp import MachineTranslationAdapter
+from .nlp import MachineTranslationAdapter, QuestionAnsweringAdapter
+
+from .centernet import CTDETAdapter
 
 __all__ = [
     'Adapter',
@@ -61,11 +74,15 @@
     'ClassificationAdapter',
 
     'SSDAdapter',
-    'TinyYOLOv1Adapter',
-    'YoloV2Adapter',
-    'YoloV3Adapter',
     'FacePersonAdapter',
     'TFObjectDetectionAPIAdapter',
+    'SSDAdapterMxNet',
+    'SSDONNXAdapter',
+    'PyTorchSSDDecoder',
+    'MTCNNPAdapter',
+    'CTDETAdapter',
+    'RetinaNetAdapter',
+    'FCOSPersonAdapter',
 
     'SegmentationAdapter',
     'BrainTumorSegmentationAdapter',
@@ -89,12 +106,15 @@
     'LPRAdapter',
 
     'HumanPoseAdapter',
+    'HumanPose3dAdapter',
 
     'ActionDetection',
 
     'HitRatioAdapter',
 
     'MaskRCNNAdapter',
+    'MaskRCNNWithTextAdapter',
 
-    'MachineTranslationAdapter'
+    'MachineTranslationAdapter',
+    'QuestionAnsweringAdapter',
 ]
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/action_recognition.py b/tools/accuracy_checker/accuracy_checker/adapters/action_recognition.py
index b2921435ad7..019ba3dd1bd 100644
--- a/tools/accuracy_checker/accuracy_checker/adapters/action_recognition.py
+++ b/tools/accuracy_checker/accuracy_checker/adapters/action_recognition.py
@@ -14,6 +14,7 @@
 limitations under the License.
 """
 
+import re
 import numpy as np
 
 from ..adapters import Adapter
@@ -100,6 +101,7 @@ def configure(self):
         self.action_threshold = self.get_value_from_config('action_confidence_threshold')
         self.action_scale = self.get_value_from_config('action_scale')
         add_conf_out_prefix = self.get_value_from_config('add_conf_out_prefix')
+        self.outputs_verified = False
 
         if self.multihead:
             self.in_sizes = self.get_value_from_config('in_sizes')
@@ -137,6 +139,8 @@ def configure(self):
     def process(self, raw, identifiers=None, frame_meta=None):
         result = []
         raw_outputs = self._extract_predictions(raw, frame_meta)
+        if not self.outputs_verified:
+            self._get_output_names(raw_outputs)
         prior_boxes = raw_outputs[self.priorbox_out][0][0].reshape(-1, 4) if not self.multihead else None
         prior_variances = raw_outputs[self.priorbox_out][0][1].reshape(-1, 4) if not self.multihead else None
 
@@ -272,3 +276,22 @@ def generate_prior_box(pos, step, anchor, image_size, blob_size):
         ]
 
         return normalized_bbox
+
+    def _get_output_names(self, raw_outputs):
+        """
+        Replace loc_out and main_conf_out patterns with the single raw output name each one matches.
+        Raises ValueError when a pattern matches no output name or more than one.
+        """
+        def pick_single_match(pattern, description):
+            candidates = [name for name in raw_outputs if pattern.match(name)]
+            if len(candidates) == 0:
+                raise ValueError('suitable layer for {} output is not found'.format(description))
+            if len(candidates) >= 2:
+                raise ValueError('more than 1 layers matched to regular expression, please specify more detailed regex')
+            return candidates[0]
+
+        loc_pattern = re.compile(self.loc_out)
+        conf_pattern = re.compile(self.main_conf_out)
+        self.loc_out = pick_single_match(loc_pattern, 'loc')
+        self.main_conf_out = pick_single_match(conf_pattern, 'main confidence')
+        self.outputs_verified = True
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/adapter.py b/tools/accuracy_checker/accuracy_checker/adapters/adapter.py
index bee31bed6d3..1da70d8aec0 100644
--- a/tools/accuracy_checker/accuracy_checker/adapters/adapter.py
+++ b/tools/accuracy_checker/accuracy_checker/adapters/adapter.py
@@ -109,6 +109,7 @@ def create_adapter(adapter_config, launcher=None, dataset=None):
         adapter = Adapter.provide(adapter_config['type'], adapter_config, label_map=label_map)
     else:
         raise ConfigError('Unknown type for adapter configuration')
+
     if launcher:
         adapter.output_blob = launcher.output_blob
 
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/centernet.py b/tools/accuracy_checker/accuracy_checker/adapters/centernet.py
new file mode 100644
index 00000000000..aab9f410b74
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/adapters/centernet.py
@@ -0,0 +1,185 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import numpy as np
+from numpy.lib.stride_tricks import as_strided
+
+from ..adapters import Adapter
+from ..config import StringField
+from ..preprocessor import CenterNetAffineTransformation
+from ..representation import DetectionPrediction
+
+
+class CTDETAdapter(Adapter):
+    """
+    Class for converting output of CenterNet (CTDET) model to DetectionPrediction representation
+    """
+    __provider__ = 'ctdet'
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update(
+            {
+                'center_heatmap_out': StringField(description="Object center points heatmap."),
+                'width_height_out': StringField(description='Object size output.'),
+                'regression_out': StringField(description='Regression output.')
+            }
+        )
+        return parameters
+
+    def configure(self):
+        self.center_heatmap_out = self.get_value_from_config('center_heatmap_out')
+        self.width_height_out = self.get_value_from_config('width_height_out')
+        self.regression_out = self.get_value_from_config('regression_out')
+
+    @staticmethod
+    def _gather_feat(feat, ind):
+        """Select rows `ind` of 2-D `feat`; result shape is (len(ind), feat.shape[1])."""
+        dim = feat.shape[1]
+        ind = np.expand_dims(ind, axis=1)
+        ind = np.repeat(ind, dim, axis=1)
+        feat = feat[ind, np.arange(feat.shape[1])]
+        return feat
+
+    @staticmethod
+    def _tranpose_and_gather_feat(feat, ind):
+        """Move the first axis of a 3-D map last, flatten the two leading axes and take rows `ind`."""
+        feat = np.transpose(feat, (1, 2, 0))
+        feat = feat.reshape((-1, feat.shape[2]))
+        feat = CTDETAdapter._gather_feat(feat, ind)
+        return feat
+
+    @staticmethod
+    def _topk(scores, K=40):
+        """
+        Pick the K highest-scoring cells of a (classes, height, width) heatmap across all classes.
+
+        Returns:
+            scores, flattened spatial indices, class ids, y and x cell coordinates (K entries each);
+            entries are not sorted by score because np.argpartition is used for selection.
+        """
+        cat, height, width = scores.shape
+
+        scores = scores.reshape((cat, -1))
+        topk_inds = np.argpartition(scores, -K, axis=1)[:, -K:]
+        topk_scores = scores[np.arange(scores.shape[0])[:, None], topk_inds]
+
+        topk_inds = topk_inds % (height * width)
+        # builtin float instead of the np.float alias, which was removed in NumPy 1.24
+        topk_ys = (topk_inds / width).astype(np.int32).astype(float)
+        topk_xs = (topk_inds % width).astype(np.int32).astype(float)
+
+        topk_scores = topk_scores.reshape((-1))
+        topk_ind = np.argpartition(topk_scores, -K)[-K:]
+        topk_score = topk_scores[topk_ind]
+        topk_clses = (topk_ind / K).astype(np.int32)
+        topk_inds = CTDETAdapter._gather_feat(
+            topk_inds.reshape((-1, 1)), topk_ind).reshape((K))
+        topk_ys = CTDETAdapter._gather_feat(topk_ys.reshape((-1, 1)), topk_ind).reshape((K))
+        topk_xs = CTDETAdapter._gather_feat(topk_xs.reshape((-1, 1)), topk_ind).reshape((K))
+
+        return topk_score, topk_inds, topk_clses, topk_ys, topk_xs
+
+    @staticmethod
+    def _nms(heat, kernel=3):
+        """Keep only heatmap values equal to the maximum of their kernel x kernel window, zero the rest."""
+        def max_pool2d(A, kernel_size, padding=1, stride=1):
+            A = np.pad(A, padding, mode='constant')
+            output_shape = ((A.shape[0] - kernel_size)//stride + 1,
+                            (A.shape[1] - kernel_size)//stride + 1)
+            kernel_size = (kernel_size, kernel_size)
+            # sliding-window view of the padded map, one kernel-sized window per output cell
+            A_w = as_strided(A, shape=output_shape + kernel_size,
+                             strides=(stride*A.strides[0],
+                                      stride*A.strides[1]) + A.strides)
+            A_w = A_w.reshape(-1, *kernel_size)
+
+            return A_w.max(axis=(1, 2)).reshape(output_shape)
+
+        pad = (kernel - 1) // 2
+
+        hmax = np.array([max_pool2d(channel, kernel, pad) for channel in heat])
+        keep = (hmax == heat)
+        return heat * keep
+
+    @staticmethod
+    def _transform_preds(coords, center, scale, output_size):
+        """Apply the transform from get_affine_transform(..., inv=1) to the first two columns of `coords`."""
+        def affine_transform(pt, t):
+            new_pt = np.array([pt[0], pt[1], 1.], dtype=np.float32).T
+            new_pt = np.dot(t, new_pt)
+            return new_pt[:2]
+
+        target_coords = np.zeros(coords.shape)
+        trans = CenterNetAffineTransformation.get_affine_transform(center, scale, 0, output_size, inv=1)
+        for p in range(coords.shape[0]):
+            target_coords[p, 0:2] = affine_transform(coords[p, 0:2], trans)
+        return target_coords
+
+    @staticmethod
+    def _transform(dets, center, scale, heigth, width):
+        """Transform both box corners (columns 0:2 and 2:4 of `dets`) in place and return `dets`."""
+        dets[:, :2] = CTDETAdapter._transform_preds(
+            dets[:, 0:2], center, scale, (width, heigth))
+        dets[:, 2:4] = CTDETAdapter._transform_preds(
+            dets[:, 2:4], center, scale, (width, heigth))
+        return dets
+
+    def process(self, raw, identifiers=None, frame_meta=None):
+        """
+        Args:
+            identifiers: list of input data identifiers
+            raw: output of model
+            frame_meta: list of meta information about each frame
+        Returns:
+            list of DetectionPrediction objects
+        """
+        result = []
+        num_predictions = 100
+        predictions_batch = self._extract_predictions(raw, frame_meta)
+        hm_batch = predictions_batch[self.center_heatmap_out]
+        wh_batch = predictions_batch[self.width_height_out]
+        reg_batch = predictions_batch[self.regression_out]
+        for identifier, heat, wh, reg, meta in zip(identifiers, hm_batch, wh_batch, reg_batch, frame_meta):
+            # numerically stable sigmoid; exp(heat) / (1 + exp(heat)) yields nan once exp(heat) overflows
+            heat = np.exp(-np.logaddexp(0, -heat))
+            height, width = heat.shape[1:3]
+
+            heat = self._nms(heat)
+            scores, inds, clses, ys, xs = self._topk(heat, K=num_predictions)
+            reg = self._tranpose_and_gather_feat(reg, inds)
+
+            reg = reg.reshape((num_predictions, 2))
+            xs = xs.reshape((num_predictions, 1)) + reg[:, 0:1]
+            ys = ys.reshape((num_predictions, 1)) + reg[:, 1:2]
+
+            wh = self._tranpose_and_gather_feat(wh, inds)
+            wh = wh.reshape((num_predictions, 2))
+            clses = clses.reshape((num_predictions, 1)).astype(float)
+            scores = scores.reshape((num_predictions, 1))
+            bboxes = np.concatenate((xs - wh[..., 0:1] / 2,
+                                     ys - wh[..., 1:2] / 2,
+                                     xs + wh[..., 0:1] / 2,
+                                     ys + wh[..., 1:2] / 2), axis=1)
+            detections = np.concatenate((bboxes, scores, clses), axis=1)
+            im_size = meta.get('image_size')
+            scale = max(im_size)
+            center = np.array(im_size[:2])/2.0
+            dets = self._transform(detections, np.flip(center), scale, height, width)
+            x_min, y_min, x_max, y_max, scores, classes = dets.transpose(1, 0)
+            result.append(DetectionPrediction(identifier, classes, scores, x_min, y_min, x_max, y_max))
+        return result
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/classification.py b/tools/accuracy_checker/accuracy_checker/adapters/classification.py
index 75f16b312c2..fd15715d161 100644
--- a/tools/accuracy_checker/accuracy_checker/adapters/classification.py
+++ b/tools/accuracy_checker/accuracy_checker/adapters/classification.py
@@ -54,6 +54,8 @@ def process(self, raw, identifiers=None, frame_meta=None):
             list of ClassificationPrediction objects
         """
         prediction = self._extract_predictions(raw, frame_meta)[self.output_blob]
+        if len(np.shape(prediction)) == 1:
+            prediction = np.expand_dims(prediction, axis=0)
         prediction = np.reshape(prediction, (prediction.shape[0], -1))
 
         result = []
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/detection.py b/tools/accuracy_checker/accuracy_checker/adapters/detection.py
index 44a7459410b..0b011d4204b 100644
--- a/tools/accuracy_checker/accuracy_checker/adapters/detection.py
+++ b/tools/accuracy_checker/accuracy_checker/adapters/detection.py
@@ -20,327 +20,11 @@
 
 import numpy as np
 
-from ..topology_types import YoloV1Tiny, YoloV2, YoloV2Tiny, YoloV3, YoloV3Tiny, SSD, FasterRCNN
+from ..topology_types import SSD, FasterRCNN
 from ..adapters import Adapter
-from ..config import ConfigValidator, NumberField, StringField, ListField
+from ..config import ConfigValidator, NumberField, StringField
 from ..postprocessor.nms import NMS
 from ..representation import DetectionPrediction, ContainerPrediction
-from ..utils import get_or_parse_value
-
-
-class TinyYOLOv1Adapter(Adapter):
-    """
-    Class for converting output of Tiny YOLO v1 model to DetectionPrediction representation
-    """
-    __provider__ = 'tiny_yolo_v1'
-    prediction_types = (DetectionPrediction, )
-    topology_types = (YoloV1Tiny, )
-
-    def process(self, raw, identifiers=None, frame_meta=None):
-        """
-        Args:
-            identifiers: list of input data identifiers
-            raw: output of model
-        Returns:
-             list of DetectionPrediction objects
-        """
-        prediction = self._extract_predictions(raw, frame_meta)[self.output_blob]
-
-        PROBABILITY_SIZE = 980
-        CONFIDENCE_SIZE = 98
-        BOXES_SIZE = 392
-
-        CELLS_X, CELLS_Y = 7, 7
-        CLASSES = 20
-        OBJECTS_PER_CELL = 2
-
-        result = []
-        for identifier, output in zip(identifiers, prediction):
-            assert PROBABILITY_SIZE + CONFIDENCE_SIZE + BOXES_SIZE == output.shape[0]
-
-            probability, scale, boxes = np.split(output, [PROBABILITY_SIZE, PROBABILITY_SIZE + CONFIDENCE_SIZE])
-
-            probability = np.reshape(probability, (CELLS_Y, CELLS_X, CLASSES))
-            scale = np.reshape(scale, (CELLS_Y, CELLS_X, OBJECTS_PER_CELL))
-            boxes = np.reshape(boxes, (CELLS_Y, CELLS_X, OBJECTS_PER_CELL, 4))
-
-            confidence = np.zeros((CELLS_Y, CELLS_X, OBJECTS_PER_CELL, CLASSES + 4))
-            for cls in range(CLASSES):
-                confidence[:, :, 0, cls] = np.multiply(probability[:, :, cls], scale[:, :, 0])
-                confidence[:, :, 1, cls] = np.multiply(probability[:, :, cls], scale[:, :, 1])
-
-            labels, scores, x_mins, y_mins, x_maxs, y_maxs = [], [], [], [], [], []
-            for i, j, k in np.ndindex((CELLS_X, CELLS_Y, OBJECTS_PER_CELL)):
-                box = boxes[j, i, k]
-                box = [(box[0] + i) / float(CELLS_X), (box[1] + j) / float(CELLS_Y), box[2] ** 2, box[3] ** 2]
-
-                label = np.argmax(confidence[j, i, k, :CLASSES])
-                score = confidence[j, i, k, label]
-
-                labels.append(label)
-                scores.append(score)
-                x_mins.append(box[0] - box[2] / 2.0)
-                y_mins.append(box[1] - box[3] / 2.0)
-                x_maxs.append(box[0] + box[2] / 2.0)
-                y_maxs.append(box[1] + box[3] / 2.0)
-
-            result.append(DetectionPrediction(identifier, labels, scores, x_mins, y_mins, x_maxs, y_maxs))
-
-        return result
-
-
-def entry_index(w, h, n_coords, n_classes, pos, entry):
-    row = pos // (w * h)
-    col = pos % (w * h)
-    return row * w * h * (n_classes + n_coords + 1) + entry * w * h + col
-
-
-class YoloV2Adapter(Adapter):
-    """
-    Class for converting output of YOLO v2 family models to DetectionPrediction representation
-    """
-    __provider__ = 'yolo_v2'
-    prediction_types = (DetectionPrediction, )
-    topology_types = (YoloV2, YoloV2Tiny, )
-
-    PRECOMPUTED_ANCHORS = {
-        'yolo_v2': [1.3221, 1.73145, 3.19275, 4.00944, 5.05587, 8.09892, 9.47112, 4.84053, 11.2364, 10.0071],
-        'tiny_yolo_v2': [1.08, 1.19, 3.42, 4.41, 6.63, 11.38, 9.42, 5.11, 16.62, 10.52]
-    }
-
-    @classmethod
-    def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
-            'classes': NumberField(
-                value_type=int, optional=True, min_value=1, default=20, description="Number of detection classes."
-            ),
-            'coords': NumberField(
-                value_type=int, optional=True, min_value=1, default=4, description="Number of bbox coordinates."
-            ),
-            'num': NumberField(
-                value_type=int, optional=True, min_value=1, default=5,
-                description="Num parameter from DarkNet configuration file."
-            ),
-            'anchors': StringField(
-                optional=True, choices=YoloV2Adapter.PRECOMPUTED_ANCHORS,
-                allow_own_choice=True, default='yolo_v2',
-                description="Anchor values provided as comma-separated list or one of precomputed: "
-                            "{}".format(', '.join(YoloV2Adapter.PRECOMPUTED_ANCHORS)))
-        })
-        return parameters
-
-    def validate_config(self):
-        super().validate_config(on_extra_argument=ConfigValidator.WARN_ON_EXTRA_ARGUMENT)
-
-    def configure(self):
-        self.classes = self.get_value_from_config('classes')
-        self.coords = self.get_value_from_config('coords')
-        self.num = self.get_value_from_config('num')
-        self.anchors = get_or_parse_value(self.get_value_from_config('anchors'), YoloV2Adapter.PRECOMPUTED_ANCHORS)
-
-    def process(self, raw, identifiers=None, frame_meta=None):
-        """
-        Args:
-            identifiers: list of input data identifiers
-            raw: output of model
-        Returns:
-            list of DetectionPrediction objects
-        """
-        predictions = self._extract_predictions(raw, frame_meta)[self.output_blob]
-
-        cells_x, cells_y = 13, 13
-
-        result = []
-        for identifier, prediction in zip(identifiers, predictions):
-            labels, scores, x_mins, y_mins, x_maxs, y_maxs = [], [], [], [], [], []
-            for y, x, n in np.ndindex((cells_y, cells_x, self.num)):
-                index = n * cells_y * cells_x + y * cells_x + x
-
-                box_index = entry_index(cells_x, cells_y, self.coords, self.classes, index, 0)
-                obj_index = entry_index(cells_x, cells_y, self.coords, self.classes, index, self.coords)
-
-                scale = prediction[obj_index]
-
-                box = [
-                    (x + prediction[box_index + 0 * (cells_y * cells_x)]) / cells_x,
-                    (y + prediction[box_index + 1 * (cells_y * cells_x)]) / cells_y,
-                    np.exp(prediction[box_index + 2 * (cells_y * cells_x)]) * self.anchors[2 * n + 0] / cells_x,
-                    np.exp(prediction[box_index + 3 * (cells_y * cells_x)]) * self.anchors[2 * n + 1] / cells_y
-                ]
-
-                classes_prob = np.empty(self.classes)
-                for cls in range(self.classes):
-                    cls_index = entry_index(cells_x, cells_y, self.coords, self.classes, index, self.coords + 1 + cls)
-                    classes_prob[cls] = prediction[cls_index]
-
-                classes_prob = classes_prob * scale
-
-                label = np.argmax(classes_prob)
-
-                labels.append(label)
-                scores.append(classes_prob[label])
-                x_mins.append(box[0] - box[2] / 2.0)
-                y_mins.append(box[1] - box[3] / 2.0)
-                x_maxs.append(box[0] + box[2] / 2.0)
-                y_maxs.append(box[1] + box[3] / 2.0)
-
-            result.append(DetectionPrediction(identifier, labels, scores, x_mins, y_mins, x_maxs, y_maxs))
-
-        return result
-
-
-class YoloV3Adapter(Adapter):
-    """
-    Class for converting output of YOLO v3 family models to DetectionPrediction representation
-    """
-    __provider__ = 'yolo_v3'
-    prediction_types = (DetectionPrediction, )
-    topology_types = (YoloV3, YoloV3Tiny, )
-
-    PRECOMPUTED_ANCHORS = {
-        'yolo_v3': [
-            10.0, 13.0,
-            16.0, 30.0,
-            33.0, 23.0,
-            30.0, 61.0,
-            62.0, 45.0,
-            59.0, 119.0,
-            116.0, 90.0,
-            156.0, 198.0,
-            373.0, 326.0
-        ],
-        'tiny_yolo_v3': [
-            10.0, 14.0,
-            23.0, 27.0,
-            37.0, 58.0,
-            81.0, 82.0,
-            135.0, 169.0,
-            344.0, 319.0
-        ]
-    }
-
-    @classmethod
-    def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
-            'classes': NumberField(
-                value_type=int, optional=True, min_value=1, default=80, description="Number of detection classes."
-            ),
-            'coords': NumberField(
-                value_type=int, optional=True, min_value=1, default=4, description="Number of bbox coordinates."
-            ),
-            'num': NumberField(
-                value_type=int, optional=True, min_value=1, default=3,
-                description="Num parameter from DarkNet configuration file."
-            ),
-            'anchors': StringField(
-                optional=True, choices=YoloV3Adapter.PRECOMPUTED_ANCHORS.keys(), allow_own_choice=True,
-                default='yolo_v3',
-                description="Anchor values provided as comma-separated list or one of precomputed: "
-                            "{}.".format(', '.join(YoloV3Adapter.PRECOMPUTED_ANCHORS.keys()))),
-            'threshold': NumberField(value_type=float, optional=True, min_value=0, default=0.001,
-                                     description="Minimal objectiveness score value for valid detections."),
-            'outputs': ListField(
-                optional=True, default=[],
-                description="The list of output layers names (optional),"
-                            " if specified there should be exactly 3 output layers provided."
-            )
-        })
-
-        return parameters
-
-    def validate_config(self):
-        super().validate_config(on_extra_argument=ConfigValidator.WARN_ON_EXTRA_ARGUMENT)
-
-    def configure(self):
-        self.classes = self.get_value_from_config('classes')
-        self.coords = self.get_value_from_config('coords')
-        self.num = self.get_value_from_config('num')
-        self.anchors = get_or_parse_value(self.get_value_from_config('anchors'), YoloV3Adapter.PRECOMPUTED_ANCHORS)
-        self.threshold = self.get_value_from_config('threshold')
-        self.outputs = self.get_value_from_config('outputs')
-
-    def process(self, raw, identifiers=None, frame_meta=None):
-        """
-        Args:
-            identifiers: list of input data identifiers
-            raw: output of model
-        Returns:
-            list of DetectionPrediction objects
-        """
-
-        def get_anchors_offset(x):
-            return int((self.num * 2) * (len(self.anchors) / (self.num * 2) - 1 - math.log2(x / 13)))
-
-        def parse_yolo_v3_results(prediction, threshold, w, h, det):
-            cells_x, cells_y = prediction.shape[1:]
-            prediction = prediction.flatten()
-            for y, x, n in np.ndindex((cells_y, cells_x, self.num)):
-                index = n * cells_y * cells_x + y * cells_x + x
-                anchors_offset = get_anchors_offset(cells_x)
-
-                box_index = entry_index(cells_x, cells_y, self.coords, self.classes, index, 0)
-                obj_index = entry_index(cells_x, cells_y, self.coords, self.classes, index, self.coords)
-
-                scale = prediction[obj_index]
-                if scale < threshold:
-                    continue
-
-                box = [
-                    (x + prediction[box_index + 0 * (cells_y * cells_x)]) / cells_x,
-                    (y + prediction[box_index + 1 * (cells_y * cells_x)]) / cells_y,
-                    np.exp(prediction[box_index + 2 * (cells_y * cells_x)]) * self.anchors[
-                        anchors_offset + 2 * n + 0] / w,
-                    np.exp(prediction[box_index + 3 * (cells_y * cells_x)]) * self.anchors[
-                        anchors_offset + 2 * n + 1] / h
-                ]
-
-                classes_prob = np.empty(self.classes)
-                for cls in range(self.classes):
-                    cls_index = entry_index(cells_x, cells_y, self.coords, self.classes, index,
-                                            self.coords + 1 + cls)
-                    classes_prob[cls] = prediction[cls_index] * scale
-
-                    det['labels'].append(cls)
-                    det['scores'].append(classes_prob[cls])
-                    det['x_mins'].append(box[0] - box[2] / 2.0)
-                    det['y_mins'].append(box[1] - box[3] / 2.0)
-                    det['x_maxs'].append(box[0] + box[2] / 2.0)
-                    det['y_maxs'].append(box[1] + box[3] / 2.0)
-
-            return det
-
-        result = []
-
-        raw_outputs = self._extract_predictions(raw, frame_meta)
-
-        if self.outputs:
-            outputs = self.outputs
-        else:
-            outputs = raw_outputs.keys()
-
-        batch = len(identifiers)
-        predictions = [[] for _ in range(batch)]
-        for blob in outputs:
-            for b in range(batch):
-                predictions[b].append(raw_outputs[blob][b])
-
-        for identifier, prediction, meta in zip(identifiers, predictions, frame_meta):
-            detections = {'labels': [], 'scores': [], 'x_mins': [], 'y_mins': [], 'x_maxs': [], 'y_maxs': []}
-            input_shape = list(meta.get('input_shape', {'data': (1, 3, 416, 416)}).values())[0]
-            self.input_width = input_shape[3]
-            self.input_height = input_shape[2]
-
-            for p in prediction:
-                parse_yolo_v3_results(p, self.threshold, self.input_width, self.input_height, detections)
-
-            result.append(DetectionPrediction(
-                identifier, detections['labels'], detections['scores'], detections['x_mins'], detections['y_mins'],
-                detections['x_maxs'], detections['y_maxs']
-            ))
-
-        return result
 
 
 class SSDAdapter(Adapter):
@@ -625,7 +309,7 @@ def process(self, raw, identifiers=None, frame_meta=None):
 
 class SSDAdapterMxNet(Adapter):
     """
-    Class for converting output of MxNet SSD model to DetectionPrediction representation
+    Class for converting output of MXNet SSD model to DetectionPrediction representation
     """
     __provider__ = 'ssd_mxnet'
 
@@ -703,3 +387,307 @@ def find_layer(regex, output_name, all_outputs):
         self.bboxes_out = find_layer(bboxes_regex, 'bboxes', raw_outputs)
 
         self.outputs_verified = True
+
+
+class MTCNNPAdapter(Adapter):
+    """
+    Class for converting output of MTCNN P-stage model ('mtcnn_p') to DetectionPrediction representation
+    """
+    __provider__ = 'mtcnn_p'
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update(
+            {
+                'probability_out': StringField(description='Name of Output layer with detection boxes probabilities'),
+                'region_out': StringField(description='Name of output layer with detected regions'),
+                'regions_format': StringField(
+                    optional=True, choices=['hw', 'wh'], default='wh',
+                    description='determination of coordinates order in regions, wh uses order x1y1x2y2, hw - y1x1y2x2'
+                )
+            }
+        )
+
+        return parameters
+
+    def configure(self):
+        self.probability_out = self.get_value_from_config('probability_out')
+        self.region_out = self.get_value_from_config('region_out')
+        self.regions_format = self.get_value_from_config('regions_format')
+
+    @staticmethod
+    def nms(boxes, threshold, overlap_type):
+        """
+        Args:
+          boxes: [:,0:5]
+          threshold: 0.5 like
+          overlap_type: 'Min' or 'Union'
+        Returns:
+            indexes of passed boxes
+        """
+        if boxes.shape[0] == 0:
+            return np.array([], dtype=int)
+        x1 = boxes[:, 0]
+        y1 = boxes[:, 1]
+        x2 = boxes[:, 2]
+        y2 = boxes[:, 3]
+        scores = boxes[:, 4]
+        area = np.multiply(x2 - x1 + 1, y2 - y1 + 1)
+        inds = np.array(scores.argsort())
+
+        pick = []
+        while np.size(inds) > 0:
+            xx1 = np.maximum(x1[inds[-1]], x1[inds[0:-1]])
+            yy1 = np.maximum(y1[inds[-1]], y1[inds[0:-1]])
+            xx2 = np.minimum(x2[inds[-1]], x2[inds[0:-1]])
+            yy2 = np.minimum(y2[inds[-1]], y2[inds[0:-1]])
+            width = np.maximum(0.0, xx2 - xx1 + 1)
+            height = np.maximum(0.0, yy2 - yy1 + 1)
+            inter = width * height
+            if overlap_type == 'Min':
+                overlap = inter / np.minimum(area[inds[-1]], area[inds[0:-1]])
+            else:
+                overlap = inter / (area[inds[-1]] + area[inds[0:-1]] - inter)
+            pick.append(inds[-1])
+            inds = inds[np.where(overlap <= threshold)[0]]
+
+        return pick
+
+    def process(self, raw, identifiers=None, frame_meta=None):
+        """Filter collected boxes with NMS (IoU threshold 0.7) and apply the box regression offsets."""
+        total_boxes_batch = self._extract_predictions(raw, frame_meta)
+        results = []
+        for total_boxes, identifier in zip(total_boxes_batch, identifiers):
+            if np.size(total_boxes) == 0:
+                results.append(DetectionPrediction(identifier, [], [], [], [], [], []))
+                continue
+            pick = self.nms(total_boxes, 0.7, 'Union')
+            total_boxes = total_boxes[pick]
+            regh = total_boxes[:, 3] - total_boxes[:, 1]
+            regw = total_boxes[:, 2] - total_boxes[:, 0]
+            x_mins = total_boxes[:, 0] + total_boxes[:, 5] * regw
+            y_mins = total_boxes[:, 1] + total_boxes[:, 6] * regh
+            x_maxs = total_boxes[:, 2] + total_boxes[:, 7] * regw
+            y_maxs = total_boxes[:, 3] + total_boxes[:, 8] * regh
+            scores = total_boxes[:, 4]
+            results.append(
+                DetectionPrediction(identifier, np.full_like(scores, 1), scores, x_mins, y_mins, x_maxs, y_maxs)
+            )
+
+        return results
+
+    @staticmethod
+    def generate_bounding_box(mapping, reg, scale, t, r_format):
+        """Build an (N, 9) array for cells of `mapping` scoring >= t: two corners, score, four regressions."""
+        stride = 2
+        cellsize = 12
+        mapping = mapping.T
+        indexes = [0, 1, 2, 3] if r_format == 'wh' else [1, 0, 3, 2]
+        dx1 = reg[indexes[0], :, :].T
+        dy1 = reg[indexes[1], :, :].T
+        dx2 = reg[indexes[2], :, :].T
+        dy2 = reg[indexes[3], :, :].T
+        (x, y) = np.where(mapping >= t)
+
+        score = mapping[x, y]
+        reg = np.array([dx1[x, y], dy1[x, y], dx2[x, y], dy2[x, y]])
+        bounding_box = np.array([y, x]).T
+
+        bb1 = np.fix((stride * bounding_box + 1) / scale).T  # matlab index from 1, so with "boundingbox-1"
+        bb2 = np.fix((stride * bounding_box + cellsize - 1 + 1) / scale).T  # while python don't have to
+        score = np.array([score])
+
+        bounding_box_out = np.concatenate((bb1, bb2, score, reg), axis=0)
+
+        return bounding_box_out.T
+
+    def _extract_predictions(self, outputs_list, meta):
+        """Stack boxes from every scale into one (N, 9) array; without 'scales' in meta return first output."""
+        if not meta[0] or 'scales' not in meta[0]:
+            return outputs_list[0]
+        scales = meta[0]['scales']
+        # builtin float: the np.float alias was removed in NumPy 1.24
+        total_boxes = np.zeros((0, 9), float)
+        for idx, outputs in enumerate(outputs_list):
+            scale = scales[idx]
+            mapping = outputs[self.probability_out][0, 1, :, :]
+            regions = outputs[self.region_out][0]
+            boxes = self.generate_bounding_box(mapping, regions, scale, 0.6, self.regions_format)
+            if boxes.shape[0] != 0:
+                pick = self.nms(boxes, 0.5, 'Union')
+
+                if np.size(pick) > 0:
+                    boxes = np.array(boxes)[pick, :]
+
+            if boxes.shape[0] != 0:
+                total_boxes = np.concatenate((total_boxes, boxes), axis=0)
+
+        return [total_boxes]
+
+
+class RetinaNetAdapter(Adapter):  # turns RetinaNet box deltas and class scores into DetectionPrediction
+    __provider__ = 'retinanet'
+
+    @classmethod
+    def parameters(cls):
+        params = super().parameters()
+        params.update({
+            'loc_out': StringField(description='boxes localization output'),
+            'class_out':  StringField(description="output with classes probabilities")
+        })
+        return params
+
+    def configure(self):
+        self.loc_out = self.get_value_from_config('loc_out')
+        self.cls_out = self.get_value_from_config('class_out')
+        self.pyramid_levels = [3, 4, 5, 6, 7]
+        self.strides = [2 ** x for x in self.pyramid_levels]  # anchor grid step for every pyramid level
+        self.sizes = [2 ** (x + 2) for x in self.pyramid_levels]  # base anchor size for every pyramid level
+        self.ratios = np.array([0.5, 1, 2])
+        self.scales = np.array([2 ** 0, 2 ** (1.0 / 3.0), 2 ** (2.0 / 3.0)])
+        self.std = np.array([0.1, 0.1, 0.2, 0.2])  # multipliers for (dx, dy, dw, dh) deltas in regress_boxes
+
+    def process(self, raw, identifiers=None, frame_meta=None):
+        raw_outputs = self._extract_predictions(raw, frame_meta)
+        results = []
+        for identifier, loc_pred, cls_pred, meta in zip(
+                identifiers, raw_outputs[self.loc_out], raw_outputs[self.cls_out], frame_meta
+        ):
+            _, _, h, w = next(iter(meta.get('input_shape', {'data': (1, 3, 800, 800)}).values()))
+            anchors = self.create_anchors([w, h])  # NOTE(review): _shift takes x count from shape[1] - confirm order
+            transformed_anchors = self.regress_boxes(anchors, loc_pred)
+            labels, scores = np.argmax(cls_pred, axis=1), np.max(cls_pred, axis=1)
+            scores_mask = np.reshape(scores > 0.05, -1)  # detections scored 0.05 or lower are dropped
+            transformed_anchors = transformed_anchors[scores_mask, :]
+            x_mins, y_mins, x_maxs, y_maxs = transformed_anchors.T
+            results.append(DetectionPrediction(
+                identifier, labels[scores_mask], scores[scores_mask], x_mins / w, y_mins / h, x_maxs / w, y_maxs / h
+            ))
+
+        return results
+
+    def create_anchors(self, input_shape):  # returns (x1, y1, x2, y2) anchors of all pyramid levels, stacked
+        def _generate_anchors(base_size=16):
+            """
+            Generate anchor (reference) windows centered at the origin by enumerating
+            every aspect ratio X scale combination for the given base size.
+            """
+            num_anchors = len(self.ratios) * len(self.scales)
+            # one (x_ctr, y_ctr, w, h) row per ratio/scale pair, centers stay at zero
+            anchors = np.zeros((num_anchors, 4))
+            # width and height both start as base_size multiplied by each scale
+            anchors[:, 2:] = base_size * np.tile(self.scales, (2, len(self.ratios))).T
+            # compute areas of anchors
+            areas = anchors[:, 2] * anchors[:, 3]
+            # reshape to the requested ratio (h / w) while preserving the area
+            anchors[:, 2] = np.sqrt(areas / np.repeat(self.ratios, len(self.scales)))
+            anchors[:, 3] = anchors[:, 2] * np.repeat(self.ratios, len(self.scales))
+            # transform from (x_ctr, y_ctr, w, h) -> (x1, y1, x2, y2)
+            anchors[:, 0::2] -= np.tile(anchors[:, 2] * 0.5, (2, 1)).T
+            anchors[:, 1::2] -= np.tile(anchors[:, 3] * 0.5, (2, 1)).T
+
+            return anchors
+
+        def _shift(shape, stride, anchors):
+            shift_x = (np.arange(0, shape[1]) + 0.5) * stride  # cell centers along x
+            shift_y = (np.arange(0, shape[0]) + 0.5) * stride  # cell centers along y
+            shift_x, shift_y = np.meshgrid(shift_x, shift_y)
+            # every grid point as an (x, y, x, y) row, so it can be added to both box corners
+            shifts = np.vstack((
+                shift_x.ravel(), shift_y.ravel(),
+                shift_x.ravel(), shift_y.ravel()
+            )).transpose()
+            a = anchors.shape[0]  # anchors per grid point
+            k = shifts.shape[0]  # number of grid points
+            all_anchors = (anchors.reshape((1, a, 4)) + shifts.reshape((1, k, 4)).transpose((1, 0, 2)))
+            all_anchors = all_anchors.reshape((k * a, 4))
+
+            return all_anchors
+
+        image_shapes = [(np.array(input_shape) + 2 ** x - 1) // (2 ** x) for x in self.pyramid_levels]
+        # image_shapes is input_shape divided by 2 ** level, rounded up; anchors are stacked in level order
+        all_anchors = np.zeros((0, 4)).astype(np.float32)
+        for idx, _ in enumerate(self.pyramid_levels):
+            anchors = _generate_anchors(base_size=self.sizes[idx])
+            shifted_anchors = _shift(image_shapes[idx], self.strides[idx], anchors)
+            all_anchors = np.append(all_anchors, shifted_anchors, axis=0)
+
+        return all_anchors
+
+    def regress_boxes(self, boxes, deltas):  # boxes are rows of (x1, y1, x2, y2), deltas rows of (dx, dy, dw, dh)
+        widths = boxes[:, 2] - boxes[:, 0]
+        heights = boxes[:, 3] - boxes[:, 1]
+        ctr_x = boxes[:, 0] + 0.5 * widths
+        ctr_y = boxes[:, 1] + 0.5 * heights
+        # deltas are multiplied by self.std before they are applied
+        dx = deltas[:, 0] * self.std[0]
+        dy = deltas[:, 1] * self.std[1]
+        dw = deltas[:, 2] * self.std[2]
+        dh = deltas[:, 3] * self.std[3]
+        # centers move by a fraction of the anchor size, sizes are scaled by exp of the delta
+        pred_ctr_x = ctr_x + dx * widths
+        pred_ctr_y = ctr_y + dy * heights
+        pred_w = np.exp(dw) * widths
+        pred_h = np.exp(dh) * heights
+        # back from center/size form to corner form
+        pred_boxes_x1 = pred_ctr_x - 0.5 * pred_w
+        pred_boxes_y1 = pred_ctr_y - 0.5 * pred_h
+        pred_boxes_x2 = pred_ctr_x + 0.5 * pred_w
+        pred_boxes_y2 = pred_ctr_y + 0.5 * pred_h
+
+        pred_boxes = np.stack([pred_boxes_x1, pred_boxes_y1, pred_boxes_x2, pred_boxes_y2], axis=1)
+
+        return pred_boxes
+
+
+class FCOSPersonAdapter(Adapter):
+    """
+    Adapter which represents output of FCOS model as DetectionPrediction objects
+    """
+    __provider__ = 'fcos_person'
+    prediction_types = (DetectionPrediction, )
+
+    def validate_config(self):
+        super().validate_config(on_extra_argument=ConfigValidator.ERROR_ON_EXTRA_ARGUMENT)
+
+    @classmethod
+    def parameters(cls):
+        params = super().parameters()
+        params.update({
+            'output_blob': StringField(optional=True, default=None, description="Output blob name."),
+            'scale': NumberField(optional=True, default=1.0, description="Scale factor for bboxes."),
+        })
+
+        return params
+
+    def configure(self):
+        self.out_blob_name = self.get_value_from_config('output_blob')
+        self.scale = self.get_value_from_config('scale')
+
+    def process(self, raw, identifiers=None, frame_meta=None):
+        """
+        Args:
+            raw: output of model
+            identifiers: list of input data identifiers
+            frame_meta: metadata forwarded to _extract_predictions
+        Returns:
+            list of DetectionPrediction objects
+        """
+
+        if self.out_blob_name is None:
+            self.out_blob_name = self.output_blob
+
+        prediction_batch = self._extract_predictions(raw, frame_meta)[self.out_blob_name]
+
+        result = []
+        for identifier in identifiers:
+            # rows whose last column (the score) is not positive are dropped
+            detections = prediction_batch[prediction_batch[:, -1] > 0.0]
+            confidences = detections[:, -1]
+            # all columns but the last one are box coordinates, multiplied by the configured scale
+            coordinates = self.scale * detections[:, :-1]
+            person_labels = np.ones([len(confidences)], dtype=np.int32)
+            result.append(DetectionPrediction(identifier, person_labels, confidences, *zip(*coordinates)))
+
+        return result
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/image_processing.py b/tools/accuracy_checker/accuracy_checker/adapters/image_processing.py
index d7385d26d79..3c064e9d582 100644
--- a/tools/accuracy_checker/accuracy_checker/adapters/image_processing.py
+++ b/tools/accuracy_checker/accuracy_checker/adapters/image_processing.py
@@ -15,12 +15,17 @@
 """
 
 import cv2
-from PIL import Image
 import numpy as np
 
 from ..adapters import Adapter
 from ..representation import SuperResolutionPrediction
-from ..config import ConfigValidator, BoolField
+from ..config import ConfigValidator, BoolField, BaseField, ConfigError
+from ..utils import get_or_parse_value
+from ..preprocessor import Normalize
+try:
+    from PIL import Image
+except ImportError:
+    Image = None
 
 
 class SuperResolutionAdapter(Adapter):
@@ -33,6 +38,16 @@ def parameters(cls):
         parameters.update({
             'reverse_channels': BoolField(
                 optional=True, default=False, description="Allow switching output image channels e.g. RGB to BGR"
+            ),
+            'mean': BaseField(
+                optional=True, default=0,
+                description='The value which should be added to prediction pixels for scaling to range [0, 255]'
+                            '(usually it is the same mean value which subtracted in preprocessing step))'
+            ),
+            'std':  BaseField(
+                optional=True, default=255,
+                description='The value on which prediction pixels should be multiplied for scaling to range '
+                            '[0, 255] (usually it is the same scale (std) used in preprocessing step))'
             )
         })
         return parameters
@@ -42,17 +57,26 @@ def validate_config(self):
 
     def configure(self):
         self.reverse_channels = self.get_value_from_config('reverse_channels')
+        self.mean = get_or_parse_value(self.launcher_config.get('mean', 0), Normalize.PRECOMPUTED_MEANS)
+        self.std = get_or_parse_value(self.launcher_config.get('std', 255), Normalize.PRECOMPUTED_STDS)
+
+        if not (len(self.mean) == 3 or len(self.mean) == 1):
+            raise ConfigError('mean should be one value or comma-separated list channel-wise values')
+
+        if not (len(self.std) == 3 or len(self.std) == 1):
+            raise ConfigError('std should be one value or comma-separated list channel-wise values')
 
     def process(self, raw, identifiers=None, frame_meta=None):
         result = []
         raw_outputs = self._extract_predictions(raw, frame_meta)
         for identifier, img_sr in zip(identifiers, raw_outputs[self.output_blob]):
-            img_sr *= 255
+            img_sr *= self.std
+            img_sr += self.mean
             img_sr = np.clip(img_sr, 0., 255.)
             img_sr = img_sr.transpose((1, 2, 0)).astype(np.uint8)
             if self.reverse_channels:
                 img_sr = cv2.cvtColor(img_sr, cv2.COLOR_BGR2RGB)
-                img_sr = Image.fromarray(img_sr, 'RGB')
+                img_sr = Image.fromarray(img_sr, 'RGB') if Image is not None else img_sr
                 img_sr = np.array(img_sr).astype(np.uint8)
             result.append(SuperResolutionPrediction(identifier, img_sr))
 
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/mask_rcnn.py b/tools/accuracy_checker/accuracy_checker/adapters/mask_rcnn.py
index 6861e5288dd..a976fa2d0d1 100644
--- a/tools/accuracy_checker/accuracy_checker/adapters/mask_rcnn.py
+++ b/tools/accuracy_checker/accuracy_checker/adapters/mask_rcnn.py
@@ -16,9 +16,14 @@
 
 import cv2
 import numpy as np
+try:
+    import pycocotools.mask as mask_util
+except ImportError:
+    mask_util = None
 from .adapter import Adapter
 from ..config import StringField, ConfigError
 from ..representation import CoCocInstanceSegmentationPrediction, DetectionPrediction, ContainerPrediction
+from ..postprocessor import FRCNNPostprocessingBboxResize
 from ..utils import contains_all
 
 
@@ -27,11 +32,9 @@ class MaskRCNNAdapter(Adapter):
 
     def __init__(self, launcher_config, label_map=None, output_blob=None):
         super().__init__(launcher_config, label_map, output_blob)
-        try:
-            import pycocotools.mask as mask_util
-            self.encoder = mask_util.encode
-        except ImportError:
+        if mask_util is None:
             raise ImportError('pycocotools is not installed. Please install it before using mask_rcnn adapter.')
+        self.encoder = mask_util.encode
 
     @classmethod
     def parameters(cls):
@@ -162,10 +165,18 @@ def _process_pytorch_outputs(self, raw_outputs, identifiers, frame_meta):
             boxes[:, 1::2] /= im_scale_y
             classes = classes.astype(np.uint32)
             masks = []
-            for box, cls, raw_mask in zip(boxes, classes, raw_masks):
-                raw_cls_mask = raw_mask[cls, ...]
+            raw_mask_for_all_classes = np.shape(raw_masks)[1] != len(identifiers)
+            if raw_mask_for_all_classes:
+                per_obj_raw_masks = []
+                for cls, raw_mask in zip(classes, raw_masks):
+                    per_obj_raw_masks.append(raw_mask[cls, ...])
+            else:
+                per_obj_raw_masks = np.squeeze(raw_masks, axis=1)
+
+            for box, raw_cls_mask in zip(boxes, per_obj_raw_masks):
                 mask = self.segm_postprocess(box, raw_cls_mask, *original_image_size, True, True)
                 masks.append(mask)
+
             x_mins, y_mins, x_maxs, y_maxs = boxes.T
             detection_prediction = DetectionPrediction(identifier, classes, scores, x_mins, y_mins, x_maxs, y_maxs)
             instance_segmentation_prediction = CoCocInstanceSegmentationPrediction(identifier, masks, classes, scores)
@@ -191,6 +202,7 @@ def _process_detection_output(self, raw_outputs, identifiers, frame_meta):
 
         for batch_index, identifier in enumerate(identifiers):
             image_size = frame_meta[batch_index]['image_size'][:2]
+            coeff_x, coeff_y = FRCNNPostprocessingBboxResize.get_coeff_x_y_from_metadata(frame_meta[batch_index])
             prediction_box_mask = np.where(detections_boxes[:, 0] == batch_index)
             filtered_detections_boxes = detections_boxes[prediction_box_mask]
             filtered_detections_boxes = filtered_detections_boxes[:, 1::]
@@ -200,8 +212,8 @@ def _process_detection_output(self, raw_outputs, identifiers, frame_meta):
             for box, masks in zip(filtered_detections_boxes, filtered_masks):
                 label = box[0]
                 cls_mask = masks[int(label)-1, ...]
-                box[2::2] *= image_size[1]
-                box[3::2] *= image_size[0]
+                box[2::2] *= coeff_x
+                box[3::2] *= coeff_y
                 cls_mask = self.segm_postprocess(box[2:], cls_mask, *image_size, True, True)
                 instance_masks.append(cls_mask)
             instance_segmentation_prediction = CoCocInstanceSegmentationPrediction(
@@ -220,7 +232,7 @@ def segm_postprocess(self, box, raw_cls_mask, im_h, im_w, full_image_mask=False,
         raw_cls_mask = np.pad(raw_cls_mask, ((1, 1), (1, 1)), 'constant', constant_values=0)
         extended_box = self.expand_boxes(box[np.newaxis, :], raw_cls_mask.shape[0] / (raw_cls_mask.shape[0] - 2.0))[0]
         extended_box = extended_box.astype(int)
-        w, h = np.maximum(extended_box[2:] - extended_box[:2] + 1, 1)
+        w, h = np.maximum(extended_box[2:] - extended_box[:2] + 1, 1)  # pylint: disable=E0633
         x0, y0 = np.clip(extended_box[:2], a_min=0, a_max=[im_w, im_h])
         x1, y1 = np.clip(extended_box[2:] + 1, a_min=0, a_max=[im_w, im_h])
 
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/mask_rcnn_with_text.py b/tools/accuracy_checker/accuracy_checker/adapters/mask_rcnn_with_text.py
new file mode 100644
index 00000000000..77cfff36859
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/adapters/mask_rcnn_with_text.py
@@ -0,0 +1,142 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import cv2
+import numpy as np
+
+from .mask_rcnn import MaskRCNNAdapter
+from ..config import StringField, NumberField
+from ..representation import TextDetectionPrediction
+
+
+class MaskRCNNWithTextAdapter(MaskRCNNAdapter):
+    """
+    Class for converting output of Mask R-CNN model with texts output to TextDetectionPrediction representation
+    """
+    __provider__ = 'mask_rcnn_with_text'
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'classes_out': StringField(
+                description="Name of output layer with information about classes.",
+                optional=False
+            ),
+            'scores_out': StringField(
+                description="Name of output layer with bbox scores.",
+                optional=False
+            ),
+            'boxes_out': StringField(
+                description="Name of output layer with bboxes.",
+                optional=False
+            ),
+            'raw_masks_out': StringField(
+                description='Name of output layer with raw instances masks.',
+                optional=False
+            ),
+            'texts_out': StringField(
+                description='Name of output layer with texts.',
+                optional=False
+            ),
+            'confidence_threshold': NumberField(
+                description='Confidence threshold that is used to filter out detected instances.',
+                optional=False
+            ),
+        })
+
+        return parameters
+
+    def configure(self):
+        self.classes_out = self.get_value_from_config('classes_out')
+        self.scores_out = self.get_value_from_config('scores_out')
+        self.boxes_out = self.get_value_from_config('boxes_out')
+        self.num_detections_out = self.get_value_from_config('num_detections_out')
+        self.raw_masks_out = self.get_value_from_config('raw_masks_out')
+        self.texts_out = self.get_value_from_config('texts_out')
+        self.confidence_threshold = self.get_value_from_config('confidence_threshold')
+
+    def process(self, raw, identifiers=None, frame_meta=None):
+        """
+        Args:
+            raw: output of model
+            identifiers: list of input data identifiers
+            frame_meta: list of image metadata with 'image_size' and 'scale_x'/'scale_y' or 'input_shape'
+        Returns:
+            list of TextDetectionPrediction objects
+        """
+        raw_outputs = self._extract_predictions(raw, frame_meta)
+
+        classes = raw_outputs[self.classes_out]
+        valid_detections_mask = classes > 0
+        classes = classes[valid_detections_mask]
+        boxes = raw_outputs[self.boxes_out][valid_detections_mask]
+        scores = raw_outputs[self.scores_out][valid_detections_mask]
+        raw_masks = raw_outputs[self.raw_masks_out][valid_detections_mask]
+        texts = raw_outputs[self.texts_out][valid_detections_mask]
+
+        confidence_filter = scores > self.confidence_threshold
+        classes = classes[confidence_filter].astype(np.uint32)
+        boxes = boxes[confidence_filter]
+        texts = texts[confidence_filter]
+        raw_masks = raw_masks[confidence_filter]
+
+        results = []
+        for identifier, image_meta in zip(identifiers, frame_meta):
+            original_image_size = image_meta['image_size'][:2]
+            if 'scale_x' in image_meta and 'scale_y' in image_meta:
+                im_scale_x = image_meta['scale_x']
+                im_scale_y = image_meta['scale_y']
+            else:
+                # 'input_shape' maps input names to shapes; the image is taken to be the 4-D (NCHW) entry
+                image_shapes = [shape for shape in image_meta['input_shape'].values() if len(shape) == 4]
+                processed_image_size = image_shapes[0][2:]
+                im_scale_y = processed_image_size[0] / original_image_size[0]
+                im_scale_x = processed_image_size[1] / original_image_size[1]
+            # rescale a private copy: dividing the shared array in place would compound across batch items
+            image_boxes = boxes.copy()
+            image_boxes[:, 0::2] /= im_scale_x
+            image_boxes[:, 1::2] /= im_scale_y
+            raw_mask_for_all_classes = np.shape(raw_masks)[1] != len(identifiers)
+            if raw_mask_for_all_classes:
+                per_obj_raw_masks = [raw_mask[cls, ...] for cls, raw_mask in zip(classes, raw_masks)]
+            else:
+                per_obj_raw_masks = np.squeeze(raw_masks, axis=1)
+            masks = [
+                self.segm_postprocess(box, raw_cls_mask, *original_image_size, True, False)
+                for box, raw_cls_mask in zip(image_boxes, per_obj_raw_masks)
+            ]
+            results.append(
+                TextDetectionPrediction(identifier, points=self.masks_to_rects(masks), description=texts))
+
+        return results
+
+    @staticmethod
+    def masks_to_rects(masks):
+        """
+        Approximate each mask by the minimum-area rotated rectangle of its largest external contour.
+        Masks without contours are skipped, so the result may be shorter than the input.
+        """
+        rects = []
+        for mask in masks:
+            contours = cv2.findContours(mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_NONE)[-2]
+            if not contours:
+                continue
+            largest = max(contours, key=cv2.contourArea)
+            # np.int0 was removed in NumPy 2.0; np.intp is the type it used to alias
+            rects.append(cv2.boxPoints(cv2.minAreaRect(largest)).astype(np.intp))
+
+        return rects
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/nlp.py b/tools/accuracy_checker/accuracy_checker/adapters/nlp.py
index b38efcac0c0..639b60eec70 100644
--- a/tools/accuracy_checker/accuracy_checker/adapters/nlp.py
+++ b/tools/accuracy_checker/accuracy_checker/adapters/nlp.py
@@ -1,8 +1,8 @@
 import re
 import numpy as np
 from .adapter import Adapter
-from ..representation import MachineTranslationPrediction
-from ..config import PathField, NumberField
+from ..representation import MachineTranslationPrediction, QuestionAnsweringPrediction, ClassificationPrediction
+from ..config import PathField, NumberField, StringField
 from ..utils import read_txt
 
 
@@ -42,9 +42,7 @@ def parameters(cls):
 
     def configure(self):
         vocab_file = self.get_value_from_config('vocabulary_file')
-        self.encoding_vocab = {
-            idx: word for idx, word in enumerate(read_txt(vocab_file, encoding='utf-8'))
-        }
+        self.encoding_vocab = dict(enumerate(read_txt(vocab_file, encoding='utf-8')))
         self.eos_index = self.get_value_from_config('eos_index')
         self.subword_option = vocab_file.name.split('.')[1] if len(vocab_file.name.split('.')) > 1 else None
 
@@ -71,3 +69,63 @@ def process(self, raw, identifiers=None, frame_meta=None):
             results.append(MachineTranslationPrediction(identifier, _clean(encoded_words, self.subword_option)))
 
         return results
+
+
+class QuestionAnsweringAdapter(Adapter):
+    __provider__ = 'bert_question_answering'
+    prediction_types = (QuestionAnsweringPrediction, )
+
+    def process(self, raw, identifiers=None, frame_meta=None):
+        # project the 3-D model output onto two channels with randomly drawn weights and a zero bias
+        hidden_states = self._extract_predictions(raw, frame_meta)[self.output_blob]
+        batch_size, seq_length, hidden_size = hidden_states.shape
+        output_weights = np.random.normal(scale=0.02, size=(2, hidden_size))
+        output_bias = np.zeros(2)
+        flattened = hidden_states.reshape((batch_size * seq_length, hidden_size))
+        logits = np.matmul(flattened, output_weights.T) + output_bias
+        logits = logits.reshape((batch_size, seq_length, 2))
+
+        # after the transpose the two channels are passed to the prediction as separate vectors
+        return [
+            QuestionAnsweringPrediction(identifier, *np.transpose(token_logits, (1, 0)))
+            for identifier, token_logits in zip(identifiers, logits)
+        ]
+
+
+class BertTextClassification(Adapter):
+    __provider__ = 'bert_classification'
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            "num_classes": NumberField(value_type=int, min_value=1, description='number of classes for classification'),
+            'classification_out': StringField(
+                optional=True,
+                description='Classification output layer name. If not provided, first output will be used.'
+            )
+        })
+
+        return parameters
+
+    def configure(self):
+        self.num_classes = self.get_value_from_config('num_classes')
+        self.classification_out = self.get_value_from_config('classification_out')
+
+    def process(self, raw, identifiers=None, frame_meta=None):
+        # fall back to the adapter's default output when no layer name is configured
+        if self.classification_out is None:
+            self.classification_out = self.output_blob
+        outputs = self._extract_predictions(raw, frame_meta)[self.classification_out]
+        predictions = outputs
+        if outputs.shape[1] != self.num_classes:
+            # output is not class-sized: map it to num_classes with randomly drawn weights and a zero bias
+            _, hidden_size = outputs.shape
+            output_weights = np.random.normal(scale=0.02, size=(self.num_classes, hidden_size))
+            output_bias = np.zeros(self.num_classes)
+            predictions = np.matmul(outputs, output_weights.T) + output_bias
+
+        return [
+            ClassificationPrediction(identifier, output)
+            for identifier, output in zip(identifiers, predictions)
+        ]
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/pose_estimation.py b/tools/accuracy_checker/accuracy_checker/adapters/pose_estimation.py
index cd02822ff52..4b5a03092e7 100644
--- a/tools/accuracy_checker/accuracy_checker/adapters/pose_estimation.py
+++ b/tools/accuracy_checker/accuracy_checker/adapters/pose_estimation.py
@@ -21,7 +21,7 @@
 import numpy as np
 
 from ..adapters import Adapter
-from ..config import ConfigValidator, StringField
+from ..config import ConfigValidator, StringField, ConfigError
 from ..representation import PoseEstimationPrediction
 
 
@@ -43,9 +43,12 @@ def parameters(cls):
         parameters = super().parameters()
         parameters.update({
             'part_affinity_fields_out': StringField(
-                description="Name of output layer with keypoints pairwise relations (part affinity fields)."
+                description="Name of output layer with keypoints pairwise relations (part affinity fields).",
+                optional=True
+            ),
+            'keypoints_heatmap_out': StringField(
+                description="Name of output layer with keypoints heatmaps.", optional=True
             ),
-            'keypoints_heatmap_out': StringField(description="Name of output layer with keypoints heatmaps."),
         })
 
         return parameters
@@ -56,14 +59,29 @@ def validate_config(self):
     def configure(self):
         self.part_affinity_fields = self.get_value_from_config('part_affinity_fields_out')
         self.keypoints_heatmap = self.get_value_from_config('keypoints_heatmap_out')
+        self.concat_out = self.part_affinity_fields is None and self.keypoints_heatmap is None
+        if not self.concat_out:
+            contains_both = self.part_affinity_fields is not None and self.keypoints_heatmap is not None
+            if not contains_both:
+                raise ConfigError(
+                    'human_pose_estimation adapter should contains both: keypoints_heatmap_out '
+                    'and part_affinity_fields_out or not contain them at all (in single output model case)'
+                )
 
     def process(self, raw, identifiers=None, frame_meta=None):
         result = []
         raw_outputs = self._extract_predictions(raw, frame_meta)
-        raw_output = zip(
-            identifiers, raw_outputs[self.keypoints_heatmap],
-            raw_outputs[self.part_affinity_fields], frame_meta
-        )
+        if not self.concat_out:
+            raw_output = zip(
+                identifiers, raw_outputs[self.keypoints_heatmap],
+                raw_outputs[self.part_affinity_fields], frame_meta
+            )
+        else:
+            concat_out = raw_outputs[self.output_blob]
+            keypoints_num = concat_out.shape[1] // 3
+            keypoints_heat_map = concat_out[:, :keypoints_num, :]
+            pafs = concat_out[:, keypoints_num:, :]
+            raw_output = zip(identifiers, keypoints_heat_map, pafs, frame_meta)
         for identifier, heatmap, paf, meta in raw_output:
             height, width, _ = meta['image_size']
             heatmap_avg = np.zeros((height, width, 19), dtype=np.float32)
@@ -96,6 +114,7 @@ def process(self, raw, identifiers=None, frame_meta=None):
     @staticmethod
     def find_peaks(heatmap, all_peaks, prev_peak_counter):
         heatmap[heatmap < 0.1] = 0
+        heatmap[np.isnan(heatmap)] = 0
         map_aug = np.zeros((heatmap.shape[0] + 2, heatmap.shape[1] + 2))
         map_left = np.zeros(map_aug.shape)
         map_right = np.zeros(map_aug.shape)
@@ -337,3 +356,61 @@ def get_poses(subset, candidate):
         scores = np.array(scores)
 
         return persons_keypoints_x, persons_keypoints_y, persons_keypoints_v, scores
+
+
+class SingleHumanPoseAdapter(Adapter):
+    """Class for converting heatmaps of single person pose estimation model to PoseEstimationPrediction"""
+    __provider__ = 'single_human_pose_estimation'
+    prediction_types = (PoseEstimationPrediction, )
+
+    def validate_config(self):
+        super().validate_config(on_extra_argument=ConfigValidator.WARN_ON_EXTRA_ARGUMENT)
+
+    def process(self, raw, identifiers=None, frame_meta=None):
+        """
+        Args:
+            raw: output of model
+            identifiers: list of input data identifiers
+            frame_meta: list of image metadata; 'rev_trans' is the matrix passed to affine_transform
+        Returns:
+            list of PoseEstimationPrediction objects, one pose per batch item
+        """
+        result = []
+        outputs_batch = self._extract_predictions(raw, frame_meta)[self.output_blob]
+        keypoints_num = outputs_batch.shape[1]
+        for i, heatmaps in enumerate(outputs_batch):
+            heatmaps = np.transpose(heatmaps, (1, 2, 0))
+            # use the metadata of the current batch item instead of always taking the first one
+            rev_trans = frame_meta[i]['rev_trans']
+            scores, x_values, y_values = [], [], []
+            for kpt_idx in range(keypoints_num):
+                score, coord = self.extract_keypoints(heatmaps[:, :, kpt_idx])
+                x, y = self.affine_transform(coord, rev_trans)
+                scores.append(score)
+                x_values.append(x)
+                y_values.append(y)
+            # pose score is the mean over keypoints scored above 0.2, or over all keypoints when there are none
+            confident_scores = [score for score in scores if score > 0.2] or scores
+            pose_score = sum(confident_scores) / len(confident_scores)
+            vis = [1] * keypoints_num
+            result.append(PoseEstimationPrediction(identifiers[i], np.array([x_values]),
+                                                   np.array([y_values]), np.array([vis]), np.array([pose_score])))
+
+        return result
+
+    @staticmethod
+    def extract_keypoints(heatmap, min_confidence=-100):
+        """
+        Return (score, (x, y)) of heatmap maximum; below min_confidence returns last element score and (-1, -1)
+        """
+        ind = np.unravel_index(np.argmax(heatmap, axis=None), heatmap.shape)
+        if heatmap[ind] < min_confidence:
+            ind = (-1, -1)
+        else:
+            ind = (int(ind[1]), int(ind[0]))
+        return heatmap[ind[1]][ind[0]], ind
+
+    @staticmethod
+    def affine_transform(pt, t):
+        """Apply matrix t to point pt extended with 1 and return the first two components of the result"""
+        return np.dot(t, np.array([pt[0], pt[1], 1.]))[:2]
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/pose_estimation_3d.py b/tools/accuracy_checker/accuracy_checker/adapters/pose_estimation_3d.py
new file mode 100644
index 00000000000..9cd8e1ad3e5
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/adapters/pose_estimation_3d.py
@@ -0,0 +1,259 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+from collections import OrderedDict
+
+import cv2
+import numpy as np
+
+from ..adapters import Adapter
+from ..adapters.pose_estimation import HumanPoseAdapter
+from ..config import ConfigValidator, StringField
+from ..representation import PoseEstimationPrediction, PoseEstimation3dPrediction
+
+AVG_PERSON_HEIGHT = 180  # multiplier applied to predicted 3D coordinates; presumably centimetres - TODO confirm
+
+# maps index of a detected 2D keypoint to its panoptic index; panoptic id 2 (pelvis, body center) is never assigned
+map_id_to_panoptic = [1, 0, 9, 10, 11, 3, 4, 5, 12, 13, 14, 6, 7, 8, 15, 16, 17, 18]
+
+limbs = [[18, 17, 1],  # each row: panoptic keypoint ids whose 3D coordinates are refined together
+         [16, 15, 1],
+         [5, 4, 3],
+         [8, 7, 6],
+         [11, 10, 9],
+         [14, 13, 12]]
+
+
+class HumanPose3dAdapter(Adapter):
+    __provider__ = 'human_pose_estimation_3d'
+    prediction_types = (PoseEstimation3dPrediction,)
+
+    def __init__(self, launcher_config, label_map=None, output_blob=None):
+        super().__init__(launcher_config, label_map, output_blob)
+        launcher_2d_config = OrderedDict([  # config for the nested 2D pose adapter, reusing the same layer names
+            ('type', HumanPoseAdapter.__provider__),
+            ('part_affinity_fields_out', launcher_config['part_affinity_fields_out']),
+            ('keypoints_heatmap_out', launcher_config['keypoints_heatmap_out'])])
+        self.pose_adapter = HumanPoseAdapter(launcher_2d_config, label_map, output_blob)  # used for peak grouping
+
+    @classmethod
+    def parameters(cls):  # base adapter parameters extended with the three output layer names read in configure()
+        parameters = super().parameters()
+        parameters.update({
+            'features_3d_out': StringField(description="Name of output layer with 3D features."),
+            'keypoints_heatmap_out': StringField(description="Name of output layer with keypoints heatmaps."),
+            'part_affinity_fields_out': StringField(
+                description="Name of output layer with keypoints pairwise relations (part affinity fields)."
+            )
+        })
+
+        return parameters
+
+    def validate_config(self):  # delegates to the base validator; extra config keys presumably only warn - confirm
+        super().validate_config(on_extra_argument=ConfigValidator.WARN_ON_EXTRA_ARGUMENT)
+
+    def configure(self):  # caches the configured output layer names that process() uses as keys into raw outputs
+        self.features_3d = self.get_value_from_config('features_3d_out')
+        self.part_affinity_fields = self.get_value_from_config('part_affinity_fields_out')
+        self.keypoints_heatmap = self.get_value_from_config('keypoints_heatmap_out')
+
+    def process(self, raw, identifiers=None, frame_meta=None):  # builds one PoseEstimation3dPrediction per input
+        result = []
+        raw_outputs = self._extract_predictions(raw, frame_meta)
+        raw_output = zip(  # NOTE(review): identifiers/frame_meta default to None but are zipped unconditionally
+            identifiers, raw_outputs[self.features_3d], raw_outputs[self.keypoints_heatmap],
+            raw_outputs[self.part_affinity_fields], frame_meta
+        )
+        for identifier, features, heatmap, paf, meta in raw_output:
+            poses_2d = self._extract_poses_2d(heatmap, paf, meta, identifier)
+            if poses_2d.size == 0:  # nothing detected in 2D: emit a prediction without 3D values
+                result.append(PoseEstimation3dPrediction(identifier, poses_2d.x_values, poses_2d.y_values))
+                continue
+
+            height, width, _ = meta['image_size']
+            scale_y = height / features.shape[1]  # image size over feature map size; axis 1 is used as height
+            scale_x = width / features.shape[2]  # axis 2 is used as width
+            panoptic_poses_3d, translations, panoptic_poses_2d = HumanPose3dAdapter._parse_poses(
+                features, poses_2d, scale_y, scale_x, 1 / scale_x
+            )
+            frame_result = PoseEstimation3dPrediction(  # 2D rows: (x, y, visibility) triples + score; 3D rows: 4-tuples
+                identifier, panoptic_poses_2d[:, 0:-1:3], panoptic_poses_2d[:, 1:-1:3], panoptic_poses_2d[:, 2:-1:3],
+                panoptic_poses_2d[:, -1], x_3d_values=panoptic_poses_3d[:, 0::4],
+                y_3d_values=panoptic_poses_3d[:, 1::4], z_3d_values=panoptic_poses_3d[:, 2::4],
+                translations=translations
+            )
+            result.append(frame_result)
+
+        return result
+
+    def _extract_poses_2d(self, heatmap, paf, meta, identifier):  # returns a PoseEstimationPrediction with 2D poses
+        height, width, _ = meta['image_size']
+        heatmap_avg = np.zeros((height, width, 19), dtype=np.float32)
+        paf_avg = np.zeros((height, width, 38), dtype=np.float32)
+        pad = meta.get('padding', [0, 0, 0, 0])  # no cropping when the meta carries no padding
+
+        heatmap = np.transpose(np.squeeze(heatmap), (1, 2, 0))  # channels moved to the last axis for cv2
+        heatmap = cv2.resize(heatmap, (0, 0), fx=8, fy=8, interpolation=cv2.INTER_CUBIC)  # upsample by 8
+        heatmap = heatmap[pad[0]:heatmap.shape[0] - pad[2], pad[1]:heatmap.shape[1] - pad[3], :]  # same crop as paf
+        heatmap = cv2.resize(heatmap, (width, height), interpolation=cv2.INTER_CUBIC)  # back to the image size
+        heatmap_avg = heatmap_avg + heatmap
+
+        paf = np.transpose(np.squeeze(paf), (1, 2, 0))
+        paf = cv2.resize(paf, (0, 0), fx=8, fy=8, interpolation=cv2.INTER_CUBIC)
+        paf = paf[pad[0]:paf.shape[0] - pad[2], pad[1]:paf.shape[1] - pad[3], :]
+        paf = cv2.resize(paf, (width, height), interpolation=cv2.INTER_CUBIC)
+        paf_avg = paf_avg + paf
+
+        peak_counter = 0
+        all_peaks = []
+        for part in range(0, 18):  # 19th for bg
+            peak_counter += self.pose_adapter.find_peaks(heatmap_avg[:, :, part], all_peaks, peak_counter)
+
+        subset, candidate = self.pose_adapter.group_peaks(all_peaks, paf_avg)
+        poses_2d = PoseEstimationPrediction(identifier, *HumanPose3dAdapter._get_poses(subset, candidate))
+        return poses_2d
+
+    @staticmethod
+    def _get_poses(subset, candidate):  # returns per-person arrays (x, y, visibility) plus one score per person
+        persons_keypoints_x, persons_keypoints_y, persons_keypoints_v = [], [], []
+        scores = []
+        num_kpt = 18
+        for subset_element in subset:
+            if subset_element.size == 0:
+                continue
+            keypoints_x, keypoints_y, keypoints_v = [0] * num_kpt, [0] * num_kpt, [0] * num_kpt
+            person_score = subset_element[-2]  # last two entries are read as score and (below) a keypoint count
+            position_id = -1
+            for keypoint_id in subset_element[:-2]:  # each entry is a row index into candidate, or -1 if missing
+                position_id += 1
+
+                cx, cy, visibility = 0, 0, 0  # Keypoint not found
+                if keypoint_id != -1:
+                    cx, cy = candidate[keypoint_id.astype(int), 0:2]
+                    cx = cx - 0.5 + 1  # +1 for matlab consistency, coords start from 1
+                    cy = cy - 0.5 + 1
+                    visibility = 1
+                keypoints_x[position_id] = cx
+                keypoints_y[position_id] = cy
+                keypoints_v[position_id] = visibility
+
+            scores.append(person_score * max(0, (subset_element[-1] - 1)))  # -1 for Neck
+            persons_keypoints_x.append(keypoints_x)
+            persons_keypoints_y.append(keypoints_y)
+            persons_keypoints_v.append(keypoints_v)
+
+        persons_keypoints_x = np.array(persons_keypoints_x)
+        persons_keypoints_y = np.array(persons_keypoints_y)
+        persons_keypoints_v = np.array(persons_keypoints_v)
+        scores = np.array(scores)
+
+        return persons_keypoints_x, persons_keypoints_y, persons_keypoints_v, scores
+
+    @staticmethod
+    def _get_root_relative_poses(features, found_poses_2d):  # returns (poses_3d, poses_2d) in panoptic keypoint order
+        poses_2d = []
+        num_kpt_panoptic = 19
+        num_kpt = 18
+        for pose_id in range(found_poses_2d.size):
+            if found_poses_2d.visibility[pose_id, 1] == 0:  # skip pose if does not found neck
+                continue
+            # just reordering
+            pose_2d = np.ones(num_kpt_panoptic * 3 + 1, dtype=np.float32) * -1  # +1 for pose confidence
+            for kpt_id in range(num_kpt):
+                if found_poses_2d.visibility[pose_id, kpt_id] != 0:
+                    pose_2d[map_id_to_panoptic[kpt_id] * 3] = found_poses_2d.x_values[pose_id, kpt_id]
+                    pose_2d[map_id_to_panoptic[kpt_id] * 3 + 1] = found_poses_2d.y_values[pose_id, kpt_id]
+                    pose_2d[map_id_to_panoptic[kpt_id] * 3 + 2] = found_poses_2d.visibility[pose_id, kpt_id]
+            pose_2d[-1] = found_poses_2d.scores[pose_id]
+            poses_2d.append(pose_2d)
+        poses_2d = np.array(poses_2d, dtype=np.float32).reshape((-1, num_kpt_panoptic * 3 + 1))  # 2D even if empty
+
+        keypoint_threshold = 0.1
+        poses_3d = np.ones((poses_2d.shape[0], num_kpt_panoptic * 4), dtype=np.float32) * -1
+        for pose_id in range(poses_3d.shape[0]):
+            pose_3d = poses_3d[pose_id]  # row view: writes below update poses_3d in place
+            if poses_2d[pose_id, 2] <= keypoint_threshold:  # column 2 is the visibility of panoptic keypoint 0
+                continue
+            neck_2d = poses_2d[pose_id, 0:2].astype(np.int32)
+            # read all pose coordinates at neck location
+            for kpt_id in range(num_kpt_panoptic):
+                map_3d = features[kpt_id * 3:(kpt_id + 1) * 3]  # three consecutive channels per keypoint
+                pose_3d[kpt_id * 4] = map_3d[0, neck_2d[1], neck_2d[0]]
+                pose_3d[kpt_id * 4 + 1] = map_3d[1, neck_2d[1], neck_2d[0]]
+                pose_3d[kpt_id * 4 + 2] = map_3d[2, neck_2d[1], neck_2d[0]]
+                pose_3d[kpt_id * 4 + 3] = poses_2d[pose_id, kpt_id * 3 + 2]
+
+            # refine keypoints coordinates at corresponding limbs locations
+            for limb in limbs:
+                for kpt_id_from in limb:
+                    if poses_2d[pose_id, kpt_id_from * 3 + 2] <= keypoint_threshold:
+                        continue
+                    for kpt_id_where in limb:
+                        kpt_from_2d = poses_2d[pose_id, kpt_id_from * 3: kpt_id_from * 3 + 2].astype(np.int32)
+                        map_3d = features[kpt_id_where * 3:(kpt_id_where + 1) * 3]
+                        pose_3d[kpt_id_where * 4] = map_3d[0, kpt_from_2d[1], kpt_from_2d[0]]
+                        pose_3d[kpt_id_where * 4 + 1] = map_3d[1, kpt_from_2d[1], kpt_from_2d[0]]
+                        pose_3d[kpt_id_where * 4 + 2] = map_3d[2, kpt_from_2d[1], kpt_from_2d[0]]
+                    break  # only the first sufficiently visible keypoint of the limb is used as the read location
+
+        poses_3d[:, 0::4] *= AVG_PERSON_HEIGHT
+        poses_3d[:, 1::4] *= AVG_PERSON_HEIGHT
+        poses_3d[:, 2::4] *= AVG_PERSON_HEIGHT
+        return poses_3d, poses_2d
+
+    @staticmethod
+    def _parse_poses(features, found_poses_2d, scale_y, scale_x, fx):  # returns (poses_3d, translations, poses_2d)
+        # map 2d coordinates from image to features space (modifies found_poses_2d in place)
+        found_poses_2d.x_values[found_poses_2d.visibility > 0] /= scale_x
+        found_poses_2d.y_values[found_poses_2d.visibility > 0] /= scale_y
+        poses_3d, poses_2d = HumanPose3dAdapter._get_root_relative_poses(features, found_poses_2d)
+
+        features_shape = features.shape
+        translations = []
+        # calculate translations
+        for pose_id in range(poses_3d.shape[0]):
+            pose_3d = poses_3d[pose_id].reshape((-1, 4)).transpose()  # rows: x, y, z, visibility
+            pose_2d = poses_2d[pose_id][:-1].reshape((-1, 3)).transpose()  # rows: x, y, visibility (score dropped)
+            num_valid = np.count_nonzero(pose_2d[2] != -1)  # -1 visibility marks a keypoint that was never filled
+            pose_3d_valid = np.zeros((3, num_valid), dtype=np.float32)
+            pose_2d_valid = np.zeros((2, num_valid), dtype=np.float32)
+            valid_id = 0
+            for kpt_id in range(pose_3d.shape[1]):
+                if pose_2d[2, kpt_id] == -1:
+                    continue
+                pose_3d_valid[:, valid_id] = pose_3d[0:3, kpt_id]
+                pose_2d_valid[:, valid_id] = pose_2d[0:2, kpt_id]
+                valid_id += 1
+            assert valid_id == num_valid
+
+            pose_2d_valid[0] = pose_2d_valid[0] - features_shape[2] / 2  # centre 2D points on the feature map
+            pose_2d_valid[1] = pose_2d_valid[1] - features_shape[1] / 2
+            mean_3d = np.expand_dims(pose_3d_valid.mean(axis=1), axis=1)
+            mean_2d = np.expand_dims(pose_2d_valid.mean(axis=1), axis=1)
+            numerator = np.trace(np.dot((pose_3d_valid[:2, :] - mean_3d[:2, :]).transpose(),
+                                        pose_3d_valid[:2, :] - mean_3d[:2, :])).sum()
+            numerator = np.sqrt(numerator)  # spread of the x/y part of the 3D points around their mean
+            denominator = np.sqrt(np.trace(np.dot((pose_2d_valid[:2, :] - mean_2d[:2, :]).transpose(),
+                                                  pose_2d_valid[:2, :] - mean_2d[:2, :])).sum())
+            mean_2d = np.array([mean_2d[0, 0], mean_2d[1, 0], fx])
+            mean_3d = np.array([mean_3d[0, 0], mean_3d[1, 0], 0])
+            translation = numerator / denominator * mean_2d - mean_3d  # NOTE(review): 0/0 if valid 2D points coincide
+            translations.append(translation)
+
+        # map 2d coordinates back to image space (NOTE(review): -1 placeholders of missing keypoints get scaled too)
+        poses_2d[:, 0:-1:3] *= scale_x
+        poses_2d[:, 1:-1:3] *= scale_y
+        return poses_3d, np.array(translations, dtype=np.float32), poses_2d
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/segmentation.py b/tools/accuracy_checker/accuracy_checker/adapters/segmentation.py
index 32a030f5f47..10f4fbe5b49 100644
--- a/tools/accuracy_checker/accuracy_checker/adapters/segmentation.py
+++ b/tools/accuracy_checker/accuracy_checker/adapters/segmentation.py
@@ -17,7 +17,7 @@
 import numpy as np
 from ..adapters import Adapter
 from ..representation import SegmentationPrediction, BrainTumorSegmentationPrediction
-from ..config import ConfigValidator, BoolField
+from ..config import ConfigValidator, BoolField, ListField, NumberField
 
 
 class SegmentationAdapter(Adapter):
@@ -71,16 +71,67 @@ def _extract_predictions(self, outputs_list, meta):
         return {self.output_blob: restore_output}
 
 
+class SegmentationOneClassAdapter(Adapter):  # turns a single-class probability map into a boolean mask
+    __provider__ = 'segmentation_one_class'
+    prediction_types = (SegmentationPrediction, )
+
+    @classmethod
+    def parameters(cls):  # base adapter parameters plus the optional binarization threshold (default 0.5)
+        params = super().parameters()
+        params.update({
+            'threshold': NumberField(
+                optional=True, value_type=float, min_value=0.0, default=0.5,
+                description='minimal probability threshold for separating predicted class from background'
+            )
+        })
+        return params
+
+    def configure(self):
+        self.threshold = self.get_value_from_config('threshold')
+
+    def process(self, raw, identifiers=None, frame_meta=None):  # returns one SegmentationPrediction per identifier
+        result = []
+        frame_meta = frame_meta or [{} for _ in identifiers]  # `[] * n` was always []; use one empty meta per input
+        raw_outputs = self._extract_predictions(raw, frame_meta)
+        for identifier, output in zip(identifiers, raw_outputs[self.output_blob]):
+            output = output > self.threshold  # strictly greater than the threshold counts as the predicted class
+            result.append(SegmentationPrediction(identifier, output))
+
+        return result
+
+
 class BrainTumorSegmentationAdapter(Adapter):
     __provider__ = 'brain_tumor_segmentation'
     prediction_types = (BrainTumorSegmentationPrediction, )
 
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'make_argmax': BoolField(
+                optional=True, default=False, description="Allows to apply argmax operation to output values."
+            ),
+            'label_order': ListField(
+                optional=True, default=[1, 2, 3], value_type=int, validate_values=True,
+                description="Specifies order of output labels, according to order of dataset labels"
+            )
+        })
+
+        return parameters
+
+    def configure(self):
+        self.argmax = self.get_value_from_config('make_argmax')
+        self.label_order = tuple(self.get_value_from_config('label_order'))
+
     def process(self, raw, identifiers=None, frame_meta=None):
         result = []
         frame_meta = frame_meta or [] * len(identifiers)
         raw_outputs = self._extract_predictions(raw, frame_meta)
         for identifier, output in zip(identifiers, raw_outputs[self.output_blob]):
-            result.append(BrainTumorSegmentationPrediction(identifier, output))
+            if self.argmax:
+                output = np.argmax(output, axis=0).astype(np.int8)
+                output = np.expand_dims(output, axis=0)
+            result.append(BrainTumorSegmentationPrediction(identifier, output, self.label_order))
 
         return result
 
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/text_detection.py b/tools/accuracy_checker/accuracy_checker/adapters/text_detection.py
index 05ffa80b55c..a5ddf322836 100644
--- a/tools/accuracy_checker/accuracy_checker/adapters/text_detection.py
+++ b/tools/accuracy_checker/accuracy_checker/adapters/text_detection.py
@@ -18,13 +18,16 @@
 
 import cv2
 import numpy as np
-from shapely.geometry import Polygon
 
 
 from ..adapters import Adapter
 from ..config import ConfigValidator, StringField, NumberField, BoolField, ConfigError
 from ..representation import TextDetectionPrediction, CharacterRecognitionPrediction
 from ..postprocessor import NMS
+try:
+    from shapely.geometry import Polygon
+except ImportError:
+    Polygon = None
 
 
 class TextDetectionAdapter(Adapter):
@@ -305,6 +308,8 @@ def configure(self):
         self.line_min_score = self.get_value_from_config('line_min_score')
         self.text_proposals_width = self.get_value_from_config('text_proposals_width')
         self.min_num_proposals = self.get_value_from_config('min_num_proposals')
+        if Polygon is None:  # shapely import failed at module load; report it under this adapter's own name
+            raise ValueError("{} adapter requires shapely, please install it".format(self.__provider__))
         self.text_proposal_connector = TextProposalConnector()
 
     def process(self, raw, identifiers=None, frame_meta=None):
@@ -667,11 +672,9 @@ class LPRAdapter(Adapter):
     __provider__ = 'lpr'
     prediction_types = (CharacterRecognitionPrediction,)
 
-    def configure(self):
+    def process(self, raw, identifiers=None, frame_meta=None):
         if not self.label_map:
             raise ConfigError('LPR adapter requires dataset label map for correct decoding.')
-
-    def process(self, raw, identifiers=None, frame_meta=None):
         raw_output = self._extract_predictions(raw, frame_meta)
         predictions = raw_output[self.output_blob]
         result = []
@@ -714,16 +717,15 @@ def parameters(cls):
 
     def validate_config(self):
         super().validate_config(on_extra_argument=ConfigValidator.IGNORE_ON_EXTRA_ARGUMENT)
-
-    def configure(self):
-        if not self.label_map:
-            raise ConfigError('Beam Search Decoder requires dataset label map for correct decoding.')
-
         self.beam_size = self.get_value_from_config('beam_size')
-        self.blank_label = self.launcher_config.get('blank_label', len(self.label_map))
+        self.blank_label = self.launcher_config.get('blank_label')
         self.softmaxed_probabilities = self.get_value_from_config('softmaxed_probabilities')
 
     def process(self, raw, identifiers=None, frame_meta=None):
+        if not self.label_map:
+            raise ConfigError('Beam Search Decoder requires dataset label map for correct decoding.')
+        if self.blank_label is None:
+            self.blank_label = len(self.label_map)
         raw_output = self._extract_predictions(raw, frame_meta)
         output = raw_output[self.output_blob]
         output = np.swapaxes(output, 0, 1)
@@ -830,6 +832,8 @@ def configure(self):
         self.score_map_thresh = self.get_value_from_config('score_map_threshold')
         self.nms_thresh = self.get_value_from_config('nms_threshold')
         self.box_thresh = self.get_value_from_config('box_threshold')
+        if Polygon is None:
+            raise ValueError("east_text_detection adapter requires shapely, please install it")
 
     def process(self, raw, identifiers=None, frame_meta=None):
         raw_outputs = self._extract_predictions(raw, frame_meta)
diff --git a/tools/accuracy_checker/accuracy_checker/adapters/yolo.py b/tools/accuracy_checker/accuracy_checker/adapters/yolo.py
new file mode 100644
index 00000000000..1e67b411081
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/adapters/yolo.py
@@ -0,0 +1,345 @@
+import math
+
+import numpy as np
+
+from ..adapters import Adapter
+from ..config import NumberField, StringField, ConfigValidator, ListField, ConfigError
+from ..representation import DetectionPrediction
+from ..topology_types import YoloV1Tiny, YoloV2, YoloV2Tiny, YoloV3, YoloV3Tiny
+from ..utils import get_or_parse_value
+
+
+class TinyYOLOv1Adapter(Adapter):
+    """
+    Converts the flat output vector of a Tiny YOLO v1 model to DetectionPrediction representation
+    """
+    __provider__ = 'tiny_yolo_v1'
+    prediction_types = (DetectionPrediction, )
+    topology_types = (YoloV1Tiny, )
+
+    def process(self, raw, identifiers=None, frame_meta=None):
+        """
+        Args:
+            raw: output of model; identifiers: list of input data identifiers
+            frame_meta: per-image metadata, only forwarded to _extract_predictions
+        Returns:
+            list of DetectionPrediction objects, one per identifier with 7 * 7 * 2 boxes each
+        """
+        prediction = self._extract_predictions(raw, frame_meta)[self.output_blob]
+
+        PROBABILITY_SIZE = 980  # 7 * 7 cells * 20 classes
+        CONFIDENCE_SIZE = 98  # 7 * 7 cells * 2 boxes
+        BOXES_SIZE = 392  # 7 * 7 cells * 2 boxes * 4 coordinates
+
+        CELLS_X, CELLS_Y = 7, 7
+        CLASSES = 20
+        OBJECTS_PER_CELL = 2
+
+        result = []
+        for identifier, output in zip(identifiers, prediction):
+            assert PROBABILITY_SIZE + CONFIDENCE_SIZE + BOXES_SIZE == output.shape[0]
+
+            probability, scale, boxes = np.split(output, [PROBABILITY_SIZE, PROBABILITY_SIZE + CONFIDENCE_SIZE])
+
+            probability = np.reshape(probability, (CELLS_Y, CELLS_X, CLASSES))
+            scale = np.reshape(scale, (CELLS_Y, CELLS_X, OBJECTS_PER_CELL))
+            boxes = np.reshape(boxes, (CELLS_Y, CELLS_X, OBJECTS_PER_CELL, 4))
+
+            confidence = np.zeros((CELLS_Y, CELLS_X, OBJECTS_PER_CELL, CLASSES + 4))  # only [:CLASSES] is used below
+            for cls in range(CLASSES):
+                confidence[:, :, 0, cls] = np.multiply(probability[:, :, cls], scale[:, :, 0])
+                confidence[:, :, 1, cls] = np.multiply(probability[:, :, cls], scale[:, :, 1])
+
+            labels, scores, x_mins, y_mins, x_maxs, y_maxs = [], [], [], [], [], []
+            for i, j, k in np.ndindex((CELLS_X, CELLS_Y, OBJECTS_PER_CELL)):  # i: column, j: row, k: box in cell
+                box = boxes[j, i, k]
+                box = [(box[0] + i) / float(CELLS_X), (box[1] + j) / float(CELLS_Y), box[2] ** 2, box[3] ** 2]
+
+                label = np.argmax(confidence[j, i, k, :CLASSES])  # best class for this box
+                score = confidence[j, i, k, label]
+
+                labels.append(label)
+                scores.append(score)
+                x_mins.append(box[0] - box[2] / 2.0)  # centre/size -> corner coordinates
+                y_mins.append(box[1] - box[3] / 2.0)
+                x_maxs.append(box[0] + box[2] / 2.0)
+                y_maxs.append(box[1] + box[3] / 2.0)
+
+            result.append(DetectionPrediction(identifier, labels, scores, x_mins, y_mins, x_maxs, y_maxs))
+
+        return result
+
+
+def entry_index(w, h, n_coords, n_classes, pos, entry):  # flat offset of channel `entry` for box/cell position `pos`
+    row = pos // (w * h)  # box (anchor) number, given pos = n * w * h + cell offset as the callers build it
+    col = pos % (w * h)  # cell offset inside the w * h grid
+    return row * w * h * (n_classes + n_coords + 1) + entry * w * h + col
+
+
+class YoloV2Adapter(Adapter):
+    """
+    Class for converting output of YOLO v2 family models to DetectionPrediction representation
+    """
+    __provider__ = 'yolo_v2'
+    prediction_types = (DetectionPrediction, )
+    topology_types = (YoloV2, YoloV2Tiny, )
+
+    PRECOMPUTED_ANCHORS = {
+        'yolo_v2': [1.3221, 1.73145, 3.19275, 4.00944, 5.05587, 8.09892, 9.47112, 4.84053, 11.2364, 10.0071],
+        'tiny_yolo_v2': [1.08, 1.19, 3.42, 4.41, 6.63, 11.38, 9.42, 5.11, 16.62, 10.52]
+    }
+
+    @classmethod
+    def parameters(cls):  # base adapter parameters plus the YOLO v2 decoding options; all of them are optional
+        parameters = super().parameters()
+        parameters.update({
+            'classes': NumberField(
+                value_type=int, optional=True, min_value=1, default=20, description="Number of detection classes."
+            ),
+            'coords': NumberField(
+                value_type=int, optional=True, min_value=1, default=4, description="Number of bbox coordinates."
+            ),
+            'num': NumberField(
+                value_type=int, optional=True, min_value=1, default=5,
+                description="Num parameter from DarkNet configuration file."
+            ),
+            'anchors': StringField(
+                optional=True, choices=YoloV2Adapter.PRECOMPUTED_ANCHORS,
+                allow_own_choice=True, default='yolo_v2',
+                description="Anchor values provided as comma-separated list or one of precomputed: "
+                            "{}".format(', '.join(YoloV2Adapter.PRECOMPUTED_ANCHORS))
+            ),
+            'cells': NumberField(
+                value_type=int, optional=True, min_value=1, default=13,
+                description="Number of cells across width and height"
+            )
+        })
+        return parameters
+
+    def validate_config(self):  # delegates to the base validator; extra config keys presumably only warn - confirm
+        super().validate_config(on_extra_argument=ConfigValidator.WARN_ON_EXTRA_ARGUMENT)
+
+    def configure(self):  # reads the decoding options declared in parameters() into instance attributes
+        self.classes = self.get_value_from_config('classes')
+        self.coords = self.get_value_from_config('coords')
+        self.num = self.get_value_from_config('num')  # number of boxes decoded per grid cell in process()
+        self.anchors = get_or_parse_value(self.get_value_from_config('anchors'), YoloV2Adapter.PRECOMPUTED_ANCHORS)
+        self.cells = self.get_value_from_config('cells')  # used for both grid width and height
+
+    def process(self, raw, identifiers=None, frame_meta=None):
+        """
+        Args:
+            raw: output of model; identifiers: list of input data identifiers
+            frame_meta: per-image metadata, only forwarded to _extract_predictions
+        Returns:
+            list of DetectionPrediction objects, one per identifier with cells * cells * num boxes each
+        """
+        predictions = self._extract_predictions(raw, frame_meta)[self.output_blob]
+
+        cells_x, cells_y = self.cells, self.cells
+
+        result = []
+        for identifier, prediction in zip(identifiers, predictions):
+            labels, scores, x_mins, y_mins, x_maxs, y_maxs = [], [], [], [], [], []
+            if len(np.shape(prediction)) == 3:
+                prediction = prediction.flatten()  # the index arithmetic below works on a flat vector
+            for y, x, n in np.ndindex((cells_y, cells_x, self.num)):
+                index = n * cells_y * cells_x + y * cells_x + x  # position of box n in cell (y, x)
+
+                box_index = entry_index(cells_x, cells_y, self.coords, self.classes, index, 0)
+                obj_index = entry_index(cells_x, cells_y, self.coords, self.classes, index, self.coords)
+
+                scale = prediction[obj_index]  # value stored right after the box coordinates; scales class scores
+
+                box = [  # centre x, centre y, width, height - all divided by the grid size
+                    (x + prediction[box_index + 0 * (cells_y * cells_x)]) / cells_x,
+                    (y + prediction[box_index + 1 * (cells_y * cells_x)]) / cells_y,
+                    np.exp(prediction[box_index + 2 * (cells_y * cells_x)]) * self.anchors[2 * n + 0] / cells_x,
+                    np.exp(prediction[box_index + 3 * (cells_y * cells_x)]) * self.anchors[2 * n + 1] / cells_y
+                ]
+
+                classes_prob = np.empty(self.classes)
+                for cls in range(self.classes):
+                    cls_index = entry_index(cells_x, cells_y, self.coords, self.classes, index, self.coords + 1 + cls)
+                    classes_prob[cls] = prediction[cls_index]
+
+                classes_prob = classes_prob * scale
+
+                label = np.argmax(classes_prob)  # only the best class is reported for each box
+
+                labels.append(label)
+                scores.append(classes_prob[label])
+                x_mins.append(box[0] - box[2] / 2.0)  # centre/size -> corner coordinates
+                y_mins.append(box[1] - box[3] / 2.0)
+                x_maxs.append(box[0] + box[2] / 2.0)
+                y_maxs.append(box[1] + box[3] / 2.0)
+
+            result.append(DetectionPrediction(identifier, labels, scores, x_mins, y_mins, x_maxs, y_maxs))
+
+        return result
+
+
+class YoloV3Adapter(Adapter):
+    """
+    Class for converting output of YOLO v3 family models to DetectionPrediction representation
+    """
+    __provider__ = 'yolo_v3'
+    prediction_types = (DetectionPrediction, )
+    topology_types = (YoloV3, YoloV3Tiny, )
+
+    PRECOMPUTED_ANCHORS = {
+        'yolo_v3': [
+            10.0, 13.0,
+            16.0, 30.0,
+            33.0, 23.0,
+            30.0, 61.0,
+            62.0, 45.0,
+            59.0, 119.0,
+            116.0, 90.0,
+            156.0, 198.0,
+            373.0, 326.0
+        ],
+        'tiny_yolo_v3': [
+            10.0, 14.0,
+            23.0, 27.0,
+            37.0, 58.0,
+            81.0, 82.0,
+            135.0, 169.0,
+            344.0, 319.0
+        ]
+    }
+
+    @classmethod
+    def parameters(cls):  # base adapter parameters plus the YOLO v3 decoding options; all of them are optional
+        parameters = super().parameters()
+        parameters.update({
+            'classes': NumberField(
+                value_type=int, optional=True, min_value=1, default=80, description="Number of detection classes."
+            ),
+            'coords': NumberField(
+                value_type=int, optional=True, min_value=1, default=4, description="Number of bbox coordinates."
+            ),
+            'num': NumberField(
+                value_type=int, optional=True, min_value=1, default=3,
+                description="Num parameter from DarkNet configuration file."
+            ),
+            'anchors': StringField(
+                optional=True, choices=YoloV3Adapter.PRECOMPUTED_ANCHORS.keys(), allow_own_choice=True,
+                default='yolo_v3',
+                description="Anchor values provided as comma-separated list or one of precomputed: "
+                            "{}.".format(', '.join(YoloV3Adapter.PRECOMPUTED_ANCHORS.keys()))),
+            'threshold': NumberField(value_type=float, optional=True, min_value=0, default=0.001,
+                                     description="Minimal objectiveness score value for valid detections."),
+            'outputs': ListField(
+                optional=True, default=[],
+                description="The list of output layers names (optional),"
+                            " if specified there should be exactly 3 output layers provided."
+            ),
+            'anchor_masks': ListField(optional=True, description='per layer used anchors mask')
+        })
+
+        return parameters
+
+    def validate_config(self):  # delegates to the base validator; extra config keys presumably only warn - confirm
+        super().validate_config(on_extra_argument=ConfigValidator.WARN_ON_EXTRA_ARGUMENT)
+
+    def configure(self):  # reads the decoding options and, if masks are given, pre-selects anchors per output layer
+        self.classes = self.get_value_from_config('classes')
+        self.coords = self.get_value_from_config('coords')
+        self.num = self.get_value_from_config('num')
+        self.anchors = get_or_parse_value(self.get_value_from_config('anchors'), YoloV3Adapter.PRECOMPUTED_ANCHORS)
+        self.threshold = self.get_value_from_config('threshold')
+        self.outputs = self.get_value_from_config('outputs')
+        anchor_masks = self.get_value_from_config('anchor_masks')
+        self.masked_anchors = None  # stays None when no masks are configured; process() then uses self.anchors
+        if anchor_masks is not None:
+            per_layer_anchors = []
+            for layer_mask in anchor_masks:
+                layer_anchors = []
+                for idx in layer_mask:  # idx selects an anchor pair from the flat anchors list
+                    layer_anchors += [self.anchors[idx * 2], self.anchors[idx * 2 + 1]]
+                per_layer_anchors.append(layer_anchors)
+            self.masked_anchors = per_layer_anchors
+
+    def process(self, raw, identifiers=None, frame_meta=None):
+        """
+        Args:
+            raw: output of model; identifiers: list of input data identifiers
+            frame_meta: per-image metadata; 'input_shape' is read from it (NOTE(review): None is not handled)
+        Returns:
+            list of DetectionPrediction objects, one per identifier, merged over all output layers
+        """
+
+        def get_anchors_offset(x, num, anchors):  # x == 13 selects the last `num` pairs; each doubling moves back
+            return int((num * 2) * (len(anchors) / (num * 2) - 1 - math.log2(x / 13)))
+
+        def parse_yolo_v3_results(prediction, threshold, w, h, det, layer_id):  # appends detections to det in place
+            cells_x, cells_y = prediction.shape[1:]
+            anchors = self.masked_anchors[layer_id] if self.masked_anchors else self.anchors
+            num = len(anchors) // 2 if self.masked_anchors else self.num
+            prediction = prediction.flatten()
+            for y, x, n in np.ndindex((cells_y, cells_x, num)):
+                index = n * cells_y * cells_x + y * cells_x + x  # position of box n in cell (y, x)
+                anchors_offset = get_anchors_offset(cells_x, num, anchors) if not self.masked_anchors else 0
+
+                box_index = entry_index(cells_x, cells_y, self.coords, self.classes, index, 0)
+                obj_index = entry_index(cells_x, cells_y, self.coords, self.classes, index, self.coords)
+                scale = prediction[obj_index]
+                if scale < threshold:  # boxes below the objectness threshold are dropped entirely
+                    continue
+
+                box = [  # centre x, centre y relative to the grid; width, height relative to the input size w, h
+                    (x + prediction[box_index + 0 * (cells_y * cells_x)]) / cells_x,
+                    (y + prediction[box_index + 1 * (cells_y * cells_x)]) / cells_y,
+                    np.exp(prediction[box_index + 2 * (cells_y * cells_x)]) * anchors[anchors_offset + 2 * n + 0] / w,
+                    np.exp(prediction[box_index + 3 * (cells_y * cells_x)]) * anchors[anchors_offset + 2 * n + 1] / h
+                ]
+
+                classes_prob = np.empty(self.classes)
+                for cls in range(self.classes):  # one detection is emitted per class for every kept box
+                    cls_index = entry_index(cells_x, cells_y, self.coords, self.classes, index,
+                                            self.coords + 1 + cls)
+                    classes_prob[cls] = prediction[cls_index] * scale
+
+                    det['labels'].append(cls)
+                    det['scores'].append(classes_prob[cls])
+                    det['x_mins'].append(box[0] - box[2] / 2.0)
+                    det['y_mins'].append(box[1] - box[3] / 2.0)
+                    det['x_maxs'].append(box[0] + box[2] / 2.0)
+                    det['y_maxs'].append(box[1] + box[3] / 2.0)
+
+            return det
+
+        result = []
+
+        raw_outputs = self._extract_predictions(raw, frame_meta)
+
+        if self.outputs:
+            outputs = self.outputs
+        else:
+            outputs = raw_outputs.keys()  # no explicit layer list: every returned blob is treated as a YOLO layer
+
+        if self.masked_anchors and len(self.masked_anchors) != len(outputs):
+            raise ConfigError('anchor mask should be specified for all output layers')
+        batch = len(identifiers)
+        predictions = [[] for _ in range(batch)]
+        for blob in outputs:  # regroup from per-layer batches to per-image lists of layer outputs
+            for b in range(batch):
+                predictions[b].append(raw_outputs[blob][b])
+
+        for identifier, prediction, meta in zip(identifiers, predictions, frame_meta):
+            detections = {'labels': [], 'scores': [], 'x_mins': [], 'y_mins': [], 'x_maxs': [], 'y_maxs': []}
+            input_shape = list(meta.get('input_shape', {'data': (1, 3, 416, 416)}).values())[0]  # first input only
+            nchw_layout = input_shape[1] == 3  # layout is decided from whether index 1 holds 3 channels
+            self.input_width = input_shape[3 if nchw_layout else 2]
+            self.input_height = input_shape[2 if nchw_layout else 1]
+
+            for layer_id, p in enumerate(prediction):
+                parse_yolo_v3_results(p, self.threshold, self.input_width, self.input_height, detections, layer_id)
+
+            result.append(DetectionPrediction(
+                identifier, detections['labels'], detections['scores'], detections['x_mins'], detections['y_mins'],
+                detections['x_maxs'], detections['y_maxs']
+            ))
+
+        return result
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/README.md b/tools/accuracy_checker/accuracy_checker/annotation_converters/README.md
index 8e9d44f5eac..d97529b8458 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/README.md
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/README.md
@@ -49,57 +49,74 @@ You may refer to `-h, --help` to full list of command line options. Some optiona
 * `-a, --annotation_name` - annotation file name.
 * `-m, --meta_name` - meta info file name.
 
-### Supported converters 
+### Supported converters
 
 Accuracy Checker supports following list of annotation converters and specific for them parameters:
-* `cifar10` - converts CIFAR 10 classification dataset to `ClassificationAnnotation`
+* `cifar` - converts [CIFAR](https://www.cs.toronto.edu/~kriz/cifar.html) classification dataset to `ClassificationAnnotation`
   * `data_batch_file` - path to pickle file which contain dataset batch (e.g. test_batch)
-  * `has_background` - allows to add background label to original labels and convert dataset for 11 classes instead 10 (default value is False).
+  * `has_background` - allows to add background label to original labels (Optional, default value is False).
   * `convert_images` - allows to convert images from pickle file to user specified directory (default value is False).
   * `converted_images_dir` - path to converted images location.
+  * `num_classes` - the number of classes in the dataset - 10 or 100 (Optional, default 10)
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `mnist_csv` - convert MNIST dataset for handwritten digit recognition stored in csv format to `ClassificationAnnotation`.
   * `annotation_file` - path to dataset file in csv format.
   * `convert_images` - allows to convert images from annotation file to user specified directory (default value is False).
   * `converted_images_dir` - path to converted images location if enabled `convert_images`.
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
+* `fashion_mnist` - convert [Fashion-MNIST](https://github.com/zalandoresearch/fashion-mnist) dataset to `ClassificationAnnotation`.
+  * `annotation_file` - path to labels file in binary format.
+  * `data_file` - path to images file in binary format.
+  * `convert_images` - allows to convert images from data file to user specified directory (default value is False).
+  * `converted_images_dir` - path to converted images location if enabled `convert_images`.
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `imagenet` - convert ImageNet dataset for image classification task to `ClassificationAnnotation`.
   * `annotation_file` - path to annotation in txt format.
   * `labels_file` - path to file with word description of labels (synset_words).
   * `has_background` - allows to add background label to original labels and convert dataset for 1001 classes instead 1000 (default value is False).
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `voc_detection` - converts Pascal VOC annotation for detection task to `DetectionAnnotation`.
-   * `imageset_file` - path to file with validation image list.
-   * `annotations_dir` - path to directory with annotation files.
-   * `images_dir` - path to directory with images related to devkit root (default JPEGImages).
-  * `has_background` - allows convert dataset with/without adding background_label. Accepted values are True or False. (default is True) 
+  * `imageset_file` - path to file with validation image list.
+  * `annotations_dir` - path to directory with annotation files.
+  * `images_dir` - path to directory with images related to devkit root (default JPEGImages).
+  * `has_background` - allows convert dataset with/without adding background_label. Accepted values are True or False. (default is True)
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `voc_segmentation` - converts Pascal VOC annotation for semantic segmentation task to `SegmentationAnnotation`.
   * `imageset_file` - path to file with validation image list.
   * `images_dir` - path to directory with images related to devkit root (default JPEGImages).
   * `mask_dir` - path to directory with ground truth segmentation masks related to devkit root (default SegmentationClass).
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `mscoco_detection` - converts MS COCO dataset for object detection task to `DetectionAnnotation`.
   * `annotation_file` - path ot annotation file in json format.
   * `has_background` - allows convert dataset with/without adding background_label. Accepted values are True or False. (default is False).
   * `use_full_label_map` - allows to use original label map (with 91 object categories) from paper instead public available(80 categories).
   * `sort_annotations` - allows to save annotations in image id ascend order.
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `mscoco_segmentation` - converts MS COCO dataset for object instance segmentation task to `CocoInstanceSegmentationAnnotation`.
   * `annotation_file` - path ot annotation file in json format.
   * `has_background` - allows convert dataset with/without adding background_label. Accepted values are True or False. (default is False).
   * `use_full_label_map` - allows to use original label map (with 91 object categories) from paper instead public available(80 categories).
   * `sort_annotations` - allows to save annotations in image id ascend order.
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `mscoco_mask_rcnn` - converts MS COCO dataset to `ContainerAnnotation` with `DetectionAnnotation` and `CocoInstanceSegmentationAnnotation` named `detection_annotation` and `segmentation_annotation` respectively.
   * `annotation_file` - path ot annotation file in json format.
   * `has_background` - allows convert dataset with/without adding background_label. Accepted values are True or False. (default is False).
   * `use_full_label_map` - allows to use original label map (with 91 object categories) from paper instead public available(80 categories).
   * `sort_annotations` - allows to save annotations in image id ascend order.
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `mscoco_keypoints` - converts MS COCO dataset for keypoints localization task to `PoseEstimationAnnotation`.
   * `annotation_file` - path ot annotation file in json format.
 * `wider` - converts from Wider Face dataset to `DetectionAnnotation`.
   * `annotation_file` - path to txt file, which contains ground truth data in WiderFace dataset format.
   * `label_start` - specifies face label index in label map. Default value is 1. You can provide another value, if you want to use this dataset for separate label validation,
   in case when your network predicts other class for faces.
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `detection_opencv_storage` - converts detection annotation stored in Detection OpenCV storage format to `DetectionAnnotation`.
   * `annotation_file` - path to annotation in xml format.
   * `image_names_file` - path to txt file, which contains image name list for dataset.
   * `label_start` - specifies label index start in label map. Default value is 1. You can provide another value, if you want to use this dataset for separate label validation.
   * `background_label` - specifies which index will be used for background label. You can not provide this parameter if your dataset has not background label.
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `cityscapes` - converts CityScapes Dataset to `SegmentationAnnotation`.
   * `dataset_root_dir` - path to dataset root.
   * `images_subfolder` - path from dataset root to directory with validation images (Optional, default `imgsFine/leftImg8bit/val`).
@@ -107,6 +124,7 @@ Accuracy Checker supports following list of annotation converters and specific f
   * `masks_suffix` - suffix for mask file names (Optional, default `_gtFine_labelTrainIds`).
   * `images_suffix` - suffix for image file names (Optional, default `_leftImg8bit`).
   * `use_full_label_map` - allows to use full label map with 33 classes instead train label map with 18 classes (Optional, default `False`).
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `vgg_face` - converts VGG Face 2 dataset for facial landmarks regression task to `FacialLandmarksAnnotation`.
   * `landmarks_csv_file` - path to csv file with coordinates of landmarks points.
   * `bbox_csv_file` - path to cvs file which contains bounding box coordinates for faces (optional parameter).
@@ -118,18 +136,29 @@ Accuracy Checker supports following list of annotation converters and specific f
   * `data_dir` - path to data directory, where gallery (`bbox_test`) and `query` subdirectories are located.
 * `market1501_reid` - converts Market1501 person reidentification dataset to `ReidentificationAnnotation`.
   * `data_dir` - path to data directory, where gallery (`bounding_box_test`) and `query` subdirectories are located.
-* `super_resolution` - converts dataset for super resolution task to `SuperResolutionAnnotation`.
+* `super_resolution` - converts dataset for single image super resolution task to `SuperResolutionAnnotation`.
   * `data_dir` - path to folder, where images in low and high resolution are located.
   * `lr_suffix` - low resolution file name's suffix (default lr).
   * `hr_suffix` - high resolution file name's suffix (default hr).
   * `annotation_loader` - which library will be used for ground truth image reading. Supported: `opencv`, `pillow` (Optional. Default value is pillow). Note, color space of image depends on loader (OpenCV uses BGR, Pillow uses RGB for image reading).
+  * `two_streams` - enables 2 input streams, where usually the first is for the original image and the second is for the upsampled image (Optional, default False).
+  * `upsample_suffix` - upsample images file name's suffix (default upsample).
+* `multi_frame_super_resolution` - converts dataset for super resolution task with multiple input frames usage.
+    * `data_dir` - path to folder, where images in low and high resolution are located.
+    * `lr_suffix` - low resolution file name's suffix (default lr).
+    * `hr_suffix` - high resolution file name's suffix (default hr).
+    * `annotation_loader` - which library will be used for ground truth image reading. Supported: `opencv`, `pillow` (Optional. Default value is pillow). Note, color space of image depends on loader (OpenCV uses BGR, Pillow uses RGB for image reading).
+    * `number_input_frames` - the number of input frames per inference.
 * `icdar_detection` - converts ICDAR13 and ICDAR15 datasets for text detection challenge to `TextDetectionAnnotation`.
   * `data_dir` - path to folder with annotations on txt format.
+  * `word_spotting` - if it is true then transcriptions that have lengths less than 3 symbols or transcriptions containing non-alphanumeric symbols will be marked as difficult.
 * `icdar13_recognition` - converts ICDAR13 dataset for text recognition task to `CharecterRecognitionAnnotation`.
   * `annotation_file` - path to annotation file in txt format.
 * `brats` - converts BraTS dataset format to `BrainTumorSegmentationAnnotation` format.
   * `data_dir` - dataset root directory, which contain subdirectories with validation data (`imagesTr`) and ground truth labels (`labelsTr`).
   Optionally you can provide relative path for these subdirectories (if they have different location) using `image_folder` and `mask_folder` parameters respectively.
+  * `mask_channels_first` - allows reading GT mask NIfTI files and transposing them to channels-first order (Optional, default False).
+  * `labels_file` - path to file, which contains labels (optional, if omitted no labels will be shown)
 * `movie_lens_converter` - converts Movie Lens Datasets format to `HitRatioAnnotation` format.
   * `rating_file` - path to file which contains movieId with top score for each userID (for example ml-1m-test-ratings.csv)
   * `negative_file` - path to file which contains negative examples.
@@ -154,9 +183,10 @@ Accuracy Checker supports following list of annotation converters and specific f
   * `mask_prefix` - prefix part for mask file names. (Optional, default is empty).
   * `image_postfix` - postfix part for mask file names (optional, default is `.png`).
   * `mask_loader` - the way how GT mask should be loaded. Supported methods: `pillow`, `opencv`, `nifti`, `numpy`, `scipy`.
-  * `dataset_meta` - path to json file with prepared dataset meta info. It should contains `label_map` key with dictionary in format class_id: class_name and optionally `segmentation_colors` (if your dataset uses color encoding). Segmentation colors is a list of channel-wise values for each class. (e.g. if your dataset has 3 classes in BGR colors, segmentation colors for it will looks like: `[[255, 0, 0], [0, 255, 0], [0, 0, 255]]`). (Optional, you can provide self-created file as `dataset_meta` in your config).
+  * `dataset_meta_file` - path to json file with prepared dataset meta info. It should contain `label_map` key with dictionary in format class_id: class_name and optionally `segmentation_colors` (if your dataset uses color encoding). Segmentation colors is a list of channel-wise values for each class (e.g. if your dataset has 3 classes in BGR colors, segmentation colors for it will look like: `[[255, 0, 0], [0, 255, 0], [0, 0, 255]]`). (Optional, you can provide self-created file as `dataset_meta` in your config).
 * `camvid` - converts CamVid dataset format to `SegmentationAnnotation`.
   * `annotation_file` - file in txt format which contains list of validation pairs (`<path_to_image>` `<path_to_annotation>` separated by space)
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `image_retrieval` - converts dataset for image retrieval task to `ReidentificationAnnotation`. Dataset should have following structure:
    1. the dataset root directory contains 2 subdirectory named `gallery` and `queries` for gallery images and query images respectively.
    2. Every of these subdirectories should contains text file with list of pairs: `<path_to_image>` `<image_ID>` (image_path and image_ID should be separated by space),  where `<path_to_image>` is path to the image related dataset root, `<image_ID>` is the number which represent image id in the gallery.
@@ -166,6 +196,7 @@ Accuracy Checker supports following list of annotation converters and specific f
 * `cvat_object_detection` - converts [CVAT XML annotation version 1.1](https://github.com/opencv/cvat/blob/develop/cvat/apps/documentation/xml_format.md#xml-annotation-format) format for images to `DetectionAnnotation`.
   * `annotation_file` - path to xml file in appropriate format.
   * `has_background` - allows prepend original labels with special class represented background and convert dataset for n+1 classes instead n (default value is True).
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
 * `cvat_attributes_recognition` - converts [CVAT XML annotation version 1.1](https://github.com/opencv/cvat/blob/develop/cvat/apps/documentation/xml_format.md#xml-annotation-format) format for images to `ClassificationAnnotation` or `ContainerAnnotation` with `ClassificationAnnotation` as value type and attribute names as keys (in multiple attributes case). Used bbox attributes as annotation classes.
   * `annotation_file` - path to xml file in appropriate format.
   * `label` - the dataset label which will be used for attributes collection (e.g. if your dataset contains 2 labels: `face` and `person` and you want recognise attributes for face, you should use `face` as value for this parameter).
@@ -190,3 +221,82 @@ Accuracy Checker supports following list of annotation converters and specific f
 * `lpr_txt` - converts annotation for license plate recognition task in txt format to `CharacterRecognitionAnnotation`.
   * `annotation_file` - path to txt annotation.
   * `decoding_dictionary` - path to file containing dictionary for output decoding.
+* `squad` - converts the Stanford Question Answering Dataset ([SQuAD](https://rajpurkar.github.io/SQuAD-explorer/)) to `QuestionAnsweringAnnotation`. **Note: This converter not only converts data to metric specific format but also tokenizes and encodes input for BERT.**
+  * `testing_file` - path to testing file.
+  * `vocab_file` - path to model vocabulary file.
+  * `max_seq_length` - maximum total input sequence length after word-piece tokenization (Optional, default value is 128).
+  * `max_query_length` - maximum number of tokens for the question (Optional, default value is 64).
+  * `doc_stride` - stride size between chunks for splitting up long document (Optional, default value is 128).
+  * `lower_case` - allows switching tokens to lower case register. It is useful for working with uncased models (Optional, default value is False).
+* `xnli` - converts The Cross-lingual Natural Language Inference Corpus ([XNLI](https://github.com/facebookresearch/XNLI)) to `TextClassificationAnnotation`. **Note: This converter not only converts data to metric specific format but also tokenizes and encodes input for BERT.**
+  * `annotation_file` - path to dataset annotation file in tsv format.
+  * `vocab_file` - path to model vocabulary file for WordPiece tokenization (Optional in case, when another tokenization approach used).
+  * `sentence_piece_model_file` - model used for [SentencePiece](https://github.com/google/sentencepiece) tokenization (Optional in case, when another tokenization approach used).
+  * `max_seq_length` - maximum total input sequence length after word-piece tokenization (Optional, default value is 128).
+  * `lower_case` - allows switching tokens to lower case register. It is useful for working with uncased models (Optional, default value is False).
+  * `language_filter` - comma-separated list of used in annotation language tags for selecting records for specific languages only. (Optional, if not used full annotation will be converted).
+* `mnli` - converts The Multi-Genre Natural Language Inference Corpus ([MNLI](http://www.nyu.edu/projects/bowman/multinli/)) to `TextClassificationAnnotation`. **Note: This converter not only converts data to metric specific format but also tokenizes and encodes input for BERT.**
+  * `annotation_file` - path to dataset annotation file in tsv format.
+  * `vocab_file` - path to model vocabulary file for WordPiece tokenization. (Optional, can be not provided in case, when another tokenization approach used.)
+  * `sentence_piece_model_file` - model used for [SentencePiece](https://github.com/google/sentencepiece) tokenization (Optional in case, when another tokenization approach used).
+  * `max_seq_length` - maximum total input sequence length after tokenization (Optional, default value is 128).
+  * `lower_case` - allows switching tokens to lower case register. It is useful for working with uncased models (Optional, default value is False).
+* `mrpc` - converts The Microsoft Research Paraphrase Corpus ([MRPC](https://www.microsoft.com/en-us/download/details.aspx?id=52398)) to `TextClassificationAnnotation`. **Note: This converter not only converts data to metric specific format but also tokenizes and encodes input for BERT.**
+  * `annotation_file` - path to dataset annotation file in tsv format.
+  * `vocab_file` - path to model vocabulary file for WordPiece tokenization. (Optional, can be not provided in case, when another tokenization approach used.)
+  * `sentence_piece_model_file` - model used for [SentencePiece](https://github.com/google/sentencepiece) tokenization (Optional in case, when another tokenization approach used).
+  * `max_seq_length` - maximum total input sequence length after tokenization (Optional, default value is 128).
+  * `lower_case` - allows switching tokens to lower case register. It is useful for working with uncased models (Optional, default value is False).
+* `cola` - converts The Corpus of Linguistic Acceptability ([CoLA](https://nyu-mll.github.io/CoLA/)) to `TextClassificationAnnotation`. **Note: This converter not only converts data to metric specific format but also tokenizes and encodes input for BERT.**
+  * `annotation_file` - path to dataset annotation file in tsv format.
+  * `vocab_file` - path to model vocabulary file for WordPiece tokenization. (Optional, can be not provided in case, when another tokenization approach used.)
+  * `sentence_piece_model_file` - model used for [SentencePiece](https://github.com/google/sentencepiece) tokenization (Optional in case, when another tokenization approach used).
+  * `max_seq_length` - maximum total input sequence length after tokenization (Optional, default value is 128).
+  * `lower_case` - allows switching tokens to lower case register. It is useful for working with uncased models (Optional, default value is False).
+* `cola` - converts The Corpus of Linguistic Acceptability ([CoLA](https://nyu-mll.github.io/CoLA/)) to `TextClassificationAnnotation`. **Note: This converter not only converts data to metric specific format but also tokenizes and encodes input for BERT.**
+  * `annotation_file` - path to dataset annotation file in tsv format.
+  * `vocab_file` - path to model vocabulary file for WordPiece tokenization. (Optional, can be not provided in case, when another tokenization approach used.)
+  * `sentence_piece_model_file` - model used for [SentencePiece](https://github.com/google/sentencepiece) tokenization (Optional in case, when another tokenization approach used).
+  * `max_seq_length` - maximum total input sequence length after tokenization (Optional, default value is 128).
+  * `lower_case` - allows switching tokens to lower case register. It is useful for working with uncased models (Optional, default value is False).
+* `imdb` - converts [IMDB sentiment dataset](https://ai.stanford.edu/~amaas/data/sentiment/) to `TextClassificationAnnotation`. **Note: This converter not only converts data to metric specific format but also tokenizes and encodes input for BERT.**
+  * `annotation_file` - path to dataset annotation file in tsv format.
+  * `vocab_file` - path to model vocabulary file for WordPiece tokenization. (Optional, can be not provided in case, when another tokenization approach used.)
+  * `sentence_piece_model_file` - model used for [SentencePiece](https://github.com/google/sentencepiece) tokenization (Optional in case, when another tokenization approach used).
+  * `max_seq_length` - maximum total input sequence length after tokenization (Optional, default value is 128).
+  * `lower_case` - allows switching tokens to lower case register. It is useful for working with uncased models (Optional, default value is False).
+* `bert_xnli_tf_record` - converts The Cross-lingual Natural Language Inference Corpus ([XNLI](https://github.com/facebookresearch/XNLI)) stored in tf records format. This converter usage requires TensorFlow installation. Please make sure that TensorFlow is installed before conversion.
+  * `annotattion_file` - path to annotation file in tf records format.
+* `cmu_panoptic_keypoints` - converts CMU Panoptic dataset to `PoseEstimation3dAnnotation` format.
+  * `data_dir` - dataset root directory, which contain subdirectories with validation scenes data.
+* `clip_action_recognition` - converts annotation of video-based action recognition datasets. Before conversion, the validation set should be preprocessed using the approach described [here](https://github.com/opencv/openvino_training_extensions/tree/develop/pytorch_toolkit/action_recognition#preparation).
+  * `annotation_file` - path to annotation file in json format.
+  * `data_dir` - path to directory with prepared data (e. g. data/kinetics/frames_data).
+  * `clips_per_video` - number of clips per video (Optional, default 3).
+  * `clip_duration` - clip duration (Optional, default 16)
+  * `temporal_stride` - temporal stride for frames selection (Optional, default 2).
+  * `numpy_input` - allows usage of numpy files instead of images. It can be useful if data requires difficult preprocessing steps (e.g. conversion to optical flow) (Optional, default `False`).
+  * `subset` - dataset split: `train`, `validation` or `test` (Optional, default `validation`).
+  * `dataset_meta_file` - path to json file with dataset meta (e.g. label_map, color_encoding). Optional, more details in [Customizing dataset meta](#customizing-dataset-meta) section.
+* `continuous_clip_action_recognition` - converts annotation of video-based MS-ASL dataset to `ClassificationAnnotation`.
+  * `annotation_file` - path to annotation file in txt format.
+  * `data_dir` - dataset root directory, which contains subdirectories with extracted video frames.
+  * `out_fps` - output frame rate of generated video clips.
+  * `clip_length` - number of frames of generated video clips.
+
+### Customizing dataset meta
+There are situations when we need to customize some default dataset parameters (e.g. replace the original dataset label map with your own).
+You are able to override parameters such as `label_map`, `segmentation_colors`, `background_label` using `dataset_meta_file` argument.
+The dataset meta file is a JSON file, which can contain the following parameters:
+  * `label_map` is a dictionary where <CLASS_ID> is the key and <CLASS_NAME> is the value.
+  * `labels` is the list of strings, which represent class names (order matters, the index of a class name is used as the class id). Can be used instead of `label_map`.
+  * `background_label` - id of background label in the dataset.
+  * `segmentation_colors` (if your dataset for semantic segmentation task uses color encoding). Segmentation colors is a list of channel-wise values for each class (e.g. if your dataset has 3 classes in BGR colors, segmentation colors for it will look like: `[[255, 0, 0], [0, 255, 0], [0, 0, 255]]`).
+Example of dataset_meta.json content:
+```json
+{
+"label_map": {"0": "background", "1": "cat", "2": "dog"},
+"background_label": "0",
+"segmentation_colors": [[0, 0, 0], [255, 0, 0], [0, 0, 255]]
+}
+```
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/__init__.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/__init__.py
index 28b7f40ce1f..5e5a7ab953a 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/__init__.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/__init__.py
@@ -24,14 +24,14 @@
 from .detection_opencv_storage import DetectionOpenCVStorageFormatConverter
 from .lfw import LFWConverter
 from .vgg_face_regression import VGGFaceRegressionConverter
-from .super_resolution_converter import SRConverter
+from .super_resolution_converter import SRConverter, SRMultiFrameConverter
 from .imagenet import ImageNetFormatConverter
 from .icdar import ICDAR13RecognitionDatasetConverter, ICDAR15DetectionDatasetConverter
-from .ms_coco import MSCocoDetectionConverter, MSCocoKeypointsConverter
+from .ms_coco import MSCocoDetectionConverter, MSCocoKeypointsConverter, MSCocoSingleKeypointsConverter
 from .cityscapes import CityscapesConverter
 from .ncf_converter import MovieLensConverter
 from .brats import BratsConverter, BratsNumpyConverter
-from .cifar10 import Cifar10FormatConverter
+from .cifar import CifarFormatConverter
 from .mnist import MNISTCSVFormatConverter
 from .wmt import WMTConverter
 from .common_semantic_segmentation import CommonSegmentationConverter
@@ -46,6 +46,18 @@
 from .cvat_multilabel_recognition import CVATMultilabelAttributesRecognitionConverter
 from .cvat_human_pose import CVATPoseEstimationConverter
 from .cvat_person_detection_action_recognition import CVATPersonDetectionActionRecognitionConverter
+from .squad import SQUADConverter
+from .text_classification import (
+    XNLIDatasetConverter,
+    BertXNLITFRecordConverter,
+    IMDBConverter,
+    MRPCConverter,
+    CoLAConverter
+)
+from .cmu_panoptic import CmuPanopticKeypointsConverter
+from .action_recognition import ActionRecognitionConverter
+from .ms_asl_continuous import MSASLContiniousConverter
+from .fashion_mnist import FashionMnistConverter
 
 __all__ = [
     'BaseFormatConverter',
@@ -63,15 +75,17 @@
     'LFWConverter',
     'VGGFaceRegressionConverter',
     'SRConverter',
+    'SRMultiFrameConverter',
     'ICDAR13RecognitionDatasetConverter',
     'ICDAR15DetectionDatasetConverter',
     'MSCocoKeypointsConverter',
+    'MSCocoSingleKeypointsConverter',
     'MSCocoDetectionConverter',
     'CityscapesConverter',
     'MovieLensConverter',
     'BratsConverter',
     'BratsNumpyConverter',
-    'Cifar10FormatConverter',
+    'CifarFormatConverter',
     'MNISTCSVFormatConverter',
     'WMTConverter',
     'CommonSegmentationConverter',
@@ -85,5 +99,15 @@
     'CVATTextRecognitionConverter',
     'CVATMultilabelAttributesRecognitionConverter',
     'CVATPoseEstimationConverter',
-    'CVATPersonDetectionActionRecognitionConverter'
+    'CVATPersonDetectionActionRecognitionConverter',
+    'SQUADConverter',
+    'XNLIDatasetConverter',
+    'BertXNLITFRecordConverter',
+    'IMDBConverter',
+    'MRPCConverter',
+    'CoLAConverter',
+    'CmuPanopticKeypointsConverter',
+    'ActionRecognitionConverter',
+    'MSASLContiniousConverter',
+    'FashionMnistConverter'
 ]
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/_nlp_common.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/_nlp_common.py
new file mode 100644
index 00000000000..181ed035f3c
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/_nlp_common.py
@@ -0,0 +1,304 @@
+import unicodedata
+try:
+    import sentencepiece as spm
+except ImportError:
+    spm = None
+from ..config import ConfigError
+from ..utils import contains_all
+
+
+SPIECE_UNDERLINE = '\N{LOWER ONE EIGHTH BLOCK}'
+SEG_ID_A = 0
+SEG_ID_B = 1
+SEG_ID_CLS = 2
+SEG_ID_SEP = 3
+SEG_ID_PAD = 4
+special_symbols = {
+    "<unk>": 0,
+    "<s>": 1,
+    "</s>": 2,
+    "<cls>": 3,
+    "<sep>": 4,
+    "<pad>": 5,
+    "<mask>": 6,
+    "<eod>": 7,
+    "<eop>": 8,
+}
+
+UNK_ID = special_symbols["<unk>"]
+CLS_ID = special_symbols["<cls>"]
+SEP_ID = special_symbols["<sep>"]
+MASK_ID = special_symbols["<mask>"]
+EOD_ID = special_symbols["<eod>"]
+
+
+WORD_PIECE_PARAMETERS = ['vocab_file']
+SENTENCE_PIECE_PARAMETERS = ['sentence_piece_model_file']
+
+
+def get_tokenizer(config, lower_case):
+    tokenizer = None
+    if contains_all(config, WORD_PIECE_PARAMETERS + SENTENCE_PIECE_PARAMETERS):
+        raise ConfigError(
+            'tokenization method can not be understood correctly from parameters, please provide: \n'
+            'for WordPiece tokenization - {}\nfor SentencePiece tokenization - {}\n'.format(
+                ', '.join(WORD_PIECE_PARAMETERS), ', '.join(SENTENCE_PIECE_PARAMETERS))
+        )
+    if contains_all(config, WORD_PIECE_PARAMETERS):
+        tokenizer = WordPieceTokenizer(config['vocab_file'], lower_case)
+
+    if contains_all(config, SENTENCE_PIECE_PARAMETERS):
+        tokenizer = SentencePieceTokenizer(config['sentence_piece_model_file'], lower_case)
+
+    if tokenizer is None:
+        raise ConfigError(
+            'tokenization parameters is not found, please provide: \n'
+            'for WordPiece tokenization - {}\nfor SentencePiece tokenization - {}\n'.format(
+                ', '.join(WORD_PIECE_PARAMETERS), ', '.join(SENTENCE_PIECE_PARAMETERS))
+        )
+    return tokenizer
+
+
+class WordPieceTokenizer:
+    def __init__(self, vocab_file, lower_case=True, tokenize_chinese_chars=True):
+        self.vocab = self.load_vocab(vocab_file)
+        self.lower_case = lower_case
+        self.tokenize_chinese_chars = tokenize_chinese_chars
+
+    @staticmethod
+    def _run_strip_accents(text):
+        """
+        Remove accents: decompose text (NFD) and drop all nonspacing marks.
+
+        An accented letter is split into its base letter and a combining mark; only the base is kept.
+        """
+        decomposed = unicodedata.normalize("NFD", text)
+        # category "Mn" (Mark, nonspacing) covers the combining accent characters
+        return "".join(char for char in decomposed if unicodedata.category(char) != "Mn")
+
+    @staticmethod
+    def _run_split_on_punc(text):
+        """
+        Split text into runs of non-punctuation characters and single punctuation marks.
+
+        Every punctuation character becomes an item of its own, e.g. "a,b" -> ["a", ",", "b"].
+        """
+        # ASCII symbols such as "$" or "^" count as punctuation here even though
+        # Unicode does not assign them to a "P*" category
+        ascii_punct = set('!"#$%&\'()*+,-./:;<=>?@[\\]^_`{|}~')
+
+        def _is_punctuation(char):
+            return char in ascii_punct or unicodedata.category(char).startswith("P")
+
+        pieces = []
+        start_new_word = True
+        for char in text:
+            if _is_punctuation(char):
+                # a punctuation mark is always an item of its own and ends the current word
+                pieces.append([char])
+                start_new_word = True
+                continue
+            if start_new_word:
+                pieces.append([])
+                start_new_word = False
+            pieces[-1].append(char)
+
+        return ["".join(piece) for piece in pieces]
+
+    def basic_tokenizer(self, text):
+        if isinstance(text, bytes):
+            text = text.decode("utf-8", "ignore")
+
+        if self.tokenize_chinese_chars:
+            text = self._tokenize_chinese_chars(text)
+
+        text = text.strip()
+        tokens = text.split() if text else []
+        split_tokens = []
+        for token in tokens:
+            if self.lower_case:
+                token = token.lower()
+                token = self._run_strip_accents(token)
+            split_tokens.extend(self._run_split_on_punc(token))
+
+        output_tokens = " ".join(split_tokens)
+        output_tokens = output_tokens.strip()
+        output_tokens = output_tokens.split() if output_tokens else []
+        return output_tokens
+
+    def _tokenize_chinese_chars(self, text):
+        """Adds whitespace around any CJK character."""
+        output = []
+        for char in text:
+            cp = ord(char)
+            if self._is_chinese_char(cp):
+                output.append(" ")
+                output.append(char)
+                output.append(" ")
+            else:
+                output.append(char)
+        return "".join(output)
+
+    @staticmethod
+    def _is_chinese_char(cp):
+        """Checks whether CP is the codepoint of a CJK character."""
+        # This defines a "chinese character" as anything in the CJK Unicode block:
+        #   https://en.wikipedia.org/wiki/CJK_Unified_Ideographs_(Unicode_block)
+        #
+        # Note that the CJK Unicode block is NOT all Japanese and Korean characters,
+        # despite its name. The modern Korean Hangul alphabet is a different block,
+        # as is Japanese Hiragana and Katakana. Those alphabets are used to write
+        # space-separated words, so they are not treated specially and handled
+        # like the all of the other languages.
+
+        #pylint:disable=chained-comparison
+        #pylint:disable=too-many-boolean-expressions
+        if ((cp >= 0x4E00 and cp <= 0x9FFF) or  #
+                (cp >= 0x3400 and cp <= 0x4DBF) or  #
+                (cp >= 0x20000 and cp <= 0x2A6DF) or  #
+                (cp >= 0x2A700 and cp <= 0x2B73F) or  #
+                (cp >= 0x2B740 and cp <= 0x2B81F) or  #
+                (cp >= 0x2B820 and cp <= 0x2CEAF) or
+                (cp >= 0xF900 and cp <= 0xFAFF) or  #
+                (cp >= 0x2F800 and cp <= 0x2FA1F)):  #
+            return True
+
+        return False
+
+    def wordpiece_tokenizer(self, text):
+        if isinstance(text, bytes):
+            text = text.decode("utf-8", "ignore")
+
+        output_tokens = []
+        text = text.strip()
+        tokens = text.split() if text else []
+        for token in tokens:
+            chars = list(token)
+            if len(chars) > 200:
+                output_tokens.append("[UNK]")
+                continue
+
+            is_bad = False
+            start = 0
+            sub_tokens = []
+            while start < len(chars):
+                end = len(chars)
+                cur_substr = None
+                while start < end:
+                    substr = "".join(chars[start:end])
+                    if start > 0:
+                        substr = "##" + substr
+                    if substr in self.vocab:
+                        cur_substr = substr
+                        break
+                    end -= 1
+                if cur_substr is None:
+                    is_bad = True
+                    break
+                sub_tokens.append(cur_substr)
+                start = end
+
+            if is_bad:
+                output_tokens.append("[UNK]")
+            else:
+                output_tokens.extend(sub_tokens)
+        return output_tokens
+
+    def tokenize(self, text):
+        """Split text with the basic tokenizer, then break every token into word pieces."""
+        return [
+            sub_token
+            for token in self.basic_tokenizer(text)
+            for sub_token in self.wordpiece_tokenizer(token)
+        ]
+
+    def convert_tokens_to_ids(self, items):
+        """
+        Look up the vocabulary index of every token; an unknown token raises KeyError.
+        """
+        return [self.vocab[item] for item in items]
+
+    @staticmethod
+    def load_vocab(file):
+        """
+        Read a WordPiece vocabulary file and map every token to its line index.
+
+        The file is decoded explicitly as UTF-8 so that non-ASCII tokens are read
+        identically on every platform instead of depending on the locale encoding.
+        Blank lines still consume an index to keep ids aligned with line numbers.
+        """
+        vocab = {}
+        with open(str(file), 'r', encoding='utf-8') as reader:
+            for index, token in enumerate(reader):
+                # surrounding whitespace (including the newline) is not part of the token
+                vocab[token.strip()] = index
+        return vocab
+
+
+def truncate_seq_pair(tokens_a, tokens_b, max_length):
+    """
+    Shorten two token lists in place until their joint length fits into max_length.
+
+    Tokens are removed one at a time from the end of whichever list is currently longer
+    (from tokens_b on a tie). A short sequence is thus kept intact as long as possible,
+    since each of its tokens likely carries more information than one of a long sequence.
+    Nothing is returned: both lists are modified directly.
+    """
+
+    # the lengths are re-evaluated on every pass because the longer list can change
+    while len(tokens_a) + len(tokens_b) > max_length:
+        # ties go to tokens_b; exactly one token is dropped per pass
+        longer = tokens_a if len(tokens_a) > len(tokens_b) else tokens_b
+        longer.pop()
+
+
+class SentencePieceTokenizer:
+    def __init__(self, tokenizer_model, lower_case=True, remove_space=True):
+        if spm is None:
+            raise ConfigError('Sentence piece tokenizer required sentencepiece, please install it before usage')
+        self.encoder = spm.SentencePieceProcessor()
+        self.encoder.Load(str(tokenizer_model))
+        self.lower_case = lower_case
+        self.remove_space = remove_space
+
+    def preprocess_text(self, inputs):
+        if self.remove_space:
+            outputs = ' '.join(inputs.strip().split())
+        else:
+            outputs = inputs
+
+        outputs = outputs.replace("``", '"').replace("''", '"')
+        if self.lower_case:
+            outputs = outputs.lower()
+
+        return outputs
+
+    def encode_ids(self, text, sample=False):
+        pieces = self.encode_pieces(text, sample)
+        ids = [self.encoder.PieceToId(piece) for piece in pieces]
+        return ids
+
+    def encode_pieces(self, text, sample=False):
+        if not sample:
+            pieces = self.encoder.EncodeAsPieces(text)
+        else:
+            pieces = self.encoder.SampleEncodeAsPieces(text, 64, 0.1)
+        new_pieces = []
+        for piece in pieces:
+            if len(piece) > 1 and piece[-1] == ',' and piece[-2].isdigit():
+                cur_pieces = self.encoder.EncodeAsPieces(
+                    piece[:-1].replace(SPIECE_UNDERLINE, ''))
+                if piece[0] != SPIECE_UNDERLINE and cur_pieces[0][0] == SPIECE_UNDERLINE:
+                    if len(cur_pieces[0]) == 1:
+                        cur_pieces = cur_pieces[1:]
+                    else:
+                        cur_pieces[0] = cur_pieces[0][1:]
+                cur_pieces.append(piece[-1])
+                new_pieces.extend(cur_pieces)
+            else:
+                new_pieces.append(piece)
+        return new_pieces
+
+    def tokenize(self, text):
+        text = self.preprocess_text(text)
+        return self.encode_ids(text)
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/action_recognition.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/action_recognition.py
new file mode 100644
index 00000000000..ce872c5570a
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/action_recognition.py
@@ -0,0 +1,172 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+from ..utils import read_json, read_txt, check_file_existence
+from ..representation import ClassificationAnnotation
+from ..data_readers import ClipIdentifier
+from ..config import PathField, NumberField, StringField, BoolField
+
+from .format_converter import BaseFormatConverter, ConverterReturn, verify_label_map
+
+
+class ActionRecognitionConverter(BaseFormatConverter):
+    __provider__ = 'clip_action_recognition'
+    annotation_types = (ClassificationAnnotation, )
+
+    @classmethod
+    def parameters(cls):
+        params = super().parameters()
+        params.update({
+            'annotation_file': PathField(description="Path to annotation file."),
+            'data_dir': PathField(is_directory=True, description="Path to data directory."),
+            'clips_per_video': NumberField(
+                value_type=int, optional=True, min_value=0, default=3, description="Number of clips per video."
+            ),
+            'clip_duration': NumberField(
+                value_type=int, optional=True, min_value=0, default=16, description="Clip duration."
+            ),
+            'temporal_stride': NumberField(
+                value_type=int, optional=True, min_value=0, default=2, description="Temporal Stride."
+            ),
+            'subset': StringField(
+                choices=['train', 'test', 'validation'], default='validation',
+                optional=True, description="Subset: train, test or validation."
+            ),
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map)', optional=True
+            ),
+            'numpy_input': BoolField(description='use numpy arrays instead of images', optional=True, default=False)
+        })
+
+        return params
+
+    def configure(self):
+        self.annotation_file = self.get_value_from_config('annotation_file')
+        self.data_dir = self.get_value_from_config('data_dir')
+        self.clips_per_video = self.get_value_from_config('clips_per_video')
+        self.clip_duration = self.get_value_from_config('clip_duration')
+        self.temporal_stride = self.get_value_from_config('temporal_stride')
+        self.subset = self.get_value_from_config('subset')
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
+        self.numpy_input = self.get_value_from_config('numpy_input')
+
+    def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
+        """
+        Build one ClassificationAnnotation per clip for every video of the configured subset.
+
+        progress_callback, when given, receives the percentage of processed clips once per
+        progress_interval clips; with check_content set, missing frame files are reported as errors.
+        """
+        full_annotation = read_json(self.annotation_file)
+        data_ext = 'jpg' if not self.numpy_input else 'npy'
+        label_map = dict(enumerate(full_annotation['labels']))
+        if self.dataset_meta:
+            dataset_meta = read_json(self.dataset_meta)
+            if 'label_map' in dataset_meta:
+                label_map = dataset_meta['label_map']
+                label_map = verify_label_map(label_map)
+            elif 'labels' in dataset_meta:
+                label_map = dict(enumerate(dataset_meta['labels']))
+        video_names, video_annotations = self.get_video_names_and_annotations(full_annotation['database'], self.subset)
+        class_to_idx = {v: k for k, v in label_map.items()}
+
+        videos = []
+        for video_name, video_annotation in zip(video_names, video_annotations):
+            video_path = self.data_dir / video_name
+            if not video_path.exists():
+                continue
+            n_frames_file = video_path / 'n_frames'
+            n_frames = (
+                int(read_txt(n_frames_file)[0].rstrip('\n\r')) if n_frames_file.exists()
+                else len(list(video_path.glob('*.{}'.format(data_ext))))
+            )
+            if n_frames <= 0:
+                continue
+            videos.append({
+                'video': video_path,
+                'video_name': video_name,
+                'segment': [1, n_frames],
+                'n_frames': n_frames,
+                'video_id': video_name,
+                'label': class_to_idx[video_annotation['label']]
+            })
+
+        videos = sorted(videos, key=lambda v: v['video_id'].split('/')[-1])
+        clips = []
+        for video in videos:
+            for clip in self.get_clips(video, self.clips_per_video, self.clip_duration, self.temporal_stride, data_ext):
+                clips.append(clip)
+
+        annotations = []
+        num_iterations = len(clips)
+        content_errors = None if not check_content else []
+        for clip_idx, clip in enumerate(clips):
+            # report on every progress_interval-th clip only, not on all the other ones
+            if progress_callback is not None and clip_idx % progress_interval == 0:
+                progress_callback(clip_idx * 100 / num_iterations)
+            identifier = ClipIdentifier(clip['video_name'], clip_idx, clip['frames'])
+            if check_content:
+                content_errors.extend([
+                    '{}: does not exist'.format(self.data_dir / frame)
+                    for frame in clip['frames'] if not check_file_existence(self.data_dir / frame)
+                ])
+            annotations.append(ClassificationAnnotation(identifier, clip['label']))
+
+        return ConverterReturn(annotations, {'label_map': label_map}, content_errors)
+
+    @staticmethod
+    def get_clips(video, clips_per_video, clip_duration, temporal_stride=1, file_ext='jpg'):
+        """
+        Yield one copy of video per sampled clip, extended with the clip's 'frames' file names.
+
+        Clips shorter than clip_duration * temporal_stride frames are looped to the full length.
+        """
+        num_frames = video['n_frames']
+        clip_duration *= temporal_stride
+        if clips_per_video == 0:
+            step = clip_duration
+        else:
+            # max(1, ...) in the divisor: a single clip per video must not divide by zero
+            step = max(1, (num_frames - clip_duration) // max(1, clips_per_video - 1))
+        for clip_start in range(1, 1 + clips_per_video * step, step):
+            clip_end = min(clip_start + clip_duration, num_frames + 1)
+            clip_idxs = list(range(clip_start, clip_end))
+            if not clip_idxs:
+                return
+            # loop clip if it is shorter than clip_duration
+            while len(clip_idxs) < clip_duration:
+                clip_idxs = (clip_idxs * 2)[:clip_duration]
+            clip = dict(video)
+            frames_idx = clip_idxs[::temporal_stride]
+            clip['frames'] = ['image_{:05d}.{}'.format(frame_idx, file_ext) for frame_idx in frames_idx]
+            yield clip
+
+    @staticmethod
+    def get_video_names_and_annotations(data, subset):
+        video_names = []
+        annotations = []
+
+        for key, value in data.items():
+            this_subset = value['subset']
+            if this_subset == subset:
+                if subset == 'testing':
+                    video_names.append('test/{}'.format(key))
+                else:
+                    label = value['annotations']['label']
+                    video_names.append('{}/{}'.format(label, key))
+                    annotations.append(value['annotations'])
+
+        return video_names, annotations
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/brats.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/brats.py
index 76fabff523b..e058f9a95c6 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/brats.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/brats.py
@@ -19,7 +19,7 @@
 
 from ..representation import BrainTumorSegmentationAnnotation
 from ..utils import get_path, read_txt, read_pickle, check_file_existence
-from ..config import StringField, PathField
+from ..config import StringField, PathField, BoolField
 from .format_converter import DirectoryBasedAnnotationConverter
 from ..representation.segmentation_representation import GTMaskLoader
 from .format_converter import ConverterReturn
@@ -34,7 +34,9 @@ def parameters(cls):
         parameters = super().parameters()
         parameters.update({
             'image_folder': StringField(optional=True, default='imagesTr', description="Image folder."),
-            'mask_folder': StringField(optional=True, default='labelsTr', description="Mask folder.")
+            'mask_folder': StringField(optional=True, default='labelsTr', description="Mask folder."),
+            'labels_file': PathField(optional=True, default=None, description="File with labels"),
+            'mask_channels_first': BoolField(optional=True, default=False)
         })
 
         return parameters
@@ -43,13 +45,15 @@ def configure(self):
         self.data_dir = self.get_value_from_config('data_dir')
         self.image_folder = self.get_value_from_config('image_folder')
         self.mask_folder = self.get_value_from_config('mask_folder')
+        self.labels_file = self.get_value_from_config('labels_file')
+        self.mask_channels_first = self.get_value_from_config('mask_channels_first')
 
     def convert(self, check_content=False, **kwargs):
         mask_folder = Path(self.mask_folder)
         image_folder = Path(self.image_folder)
         image_dir = get_path(self.data_dir / image_folder, is_directory=True)
         mask_dir = get_path(self.data_dir / mask_folder, is_directory=True)
-        content_check_erros = [] if check_content else None
+        content_check_errors = [] if check_content else None
 
         annotations = []
         for file_in_dir in image_dir.iterdir():
@@ -59,7 +63,7 @@ def convert(self, check_content=False, **kwargs):
                 if not check_content:
                     warnings.warn('Annotation mask for {} does not exists. File will be ignored.'.format(file_name))
                 else:
-                    content_check_erros.append(
+                    content_check_errors.append(
                         '{}: '.format(str(file_in_dir)) +
                         'annotation mask does not exists, please remove this file or add gt mask '
                         '({}).'.format(str(mask))
@@ -68,11 +72,17 @@ def convert(self, check_content=False, **kwargs):
             annotation = BrainTumorSegmentationAnnotation(
                 str(image_folder / file_name),
                 str(mask_folder / file_name),
+                loader=GTMaskLoader.NIFTI_CHANNELS_FIRST if self.mask_channels_first else GTMaskLoader.NIFTI
             )
 
             annotations.append(annotation)
 
-        return ConverterReturn(annotations, None, content_check_erros)
+        return ConverterReturn(annotations, self._get_meta(), content_check_errors)
+
+    def _get_meta(self):
+        if not self.labels_file:
+            return None
+        return {'label_map': dict(enumerate(read_txt(self.labels_file)))}
 
 
 class BratsNumpyConverter(DirectoryBasedAnnotationConverter):
@@ -148,4 +158,4 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
     def _get_meta(self):
         if not self.labels_file:
             return None
-        return {'label_map': [line for line in read_txt(self.labels_file)]}
+        return {'label_map': dict(enumerate(read_txt(self.labels_file)))}
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/camvid.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/camvid.py
index 3cb53356430..68ebe358980 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/camvid.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/camvid.py
@@ -1,6 +1,8 @@
-from .format_converter import FileBasedAnnotationConverter, ConverterReturn
+from .format_converter import FileBasedAnnotationConverter, ConverterReturn, verify_label_map
 from ..utils import read_txt, check_file_existence
 from ..representation import SegmentationAnnotation
+from ..config import PathField
+from ..utils import read_json
 
 
 class CamVidConverter(FileBasedAnnotationConverter):
@@ -11,23 +13,37 @@ class CamVidConverter(FileBasedAnnotationConverter):
             0: 'Sky',
             1: 'Building',
             2: 'Pole',
-            3: 'Road',
-            4: 'Pavement',
-            5: 'Tree',
-            6: 'SignSymbol',
-            7: 'Fence',
-            8: 'Car',
-            9: 'Pedestrian',
-            10: 'Bicyclist',
-            11: 'Unlabelled'
+            3: 'Road_marking',
+            4: 'Road',
+            5: 'Pavement',
+            6: 'Tree',
+            7: 'SignSymbol',
+            8: 'Fence',
+            9: 'Car',
+            10: 'Pedestrian',
+            11: 'Bicyclist',
+            12: 'Unlabelled'
         },
-        'background_label': 11,
+        'background_label': 12,
         'segmentation_colors': (
-            (128, 128, 128), (128, 0, 0), (192, 192, 128), (128, 64, 128), (60, 40, 222), (128, 128, 0),
+            (128, 128, 128), (128, 0, 0), (192, 192, 128), (255, 69, 0), (128, 64, 128), (60, 40, 222), (128, 128, 0),
             (192, 128, 128), (64, 64, 128), (64, 0, 128), (64, 64, 0), (0, 128, 192), (0, 0, 0)
         )
     }
 
+    @classmethod
+    def parameters(cls):
+        params = super().parameters()
+        params.update({
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map, color_encoding', optional=True
+            )})
+        return params
+
+    def configure(self):
+        super().configure()
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
+
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
         annotation = read_txt(self.annotation_file)
         annotations = []
@@ -45,5 +61,12 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
             annotations.append(SegmentationAnnotation(identifier, gt_file))
             if progress_callback is not None and line_id % progress_interval == 0:
                 progress_callback(line_id * 100 / num_iterations)
+        meta = self.meta
+        if self.dataset_meta:
+            meta = read_json(self.dataset_meta)
+            if 'label_map' in meta:
+                meta['label_map'] = verify_label_map(meta['label_map'])
+            if 'labels' in meta and 'label_map' not in meta:
+                meta['label_map'] = dict(enumerate(meta['labels']))
 
-        return ConverterReturn(annotations, self.meta, content_errors)
+        return ConverterReturn(annotations, meta, content_errors)
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/cifar10.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/cifar.py
similarity index 65%
rename from tools/accuracy_checker/accuracy_checker/annotation_converters/cifar10.py
rename to tools/accuracy_checker/accuracy_checker/annotation_converters/cifar.py
index 78501747523..743ec09db4b 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/cifar10.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/cifar.py
@@ -14,34 +14,66 @@
 limitations under the License.
 """
 
-from PIL import Image
 import numpy as np
-from ..config import PathField, BoolField
+from ..config import PathField, BoolField, NumberField
 from ..representation import ClassificationAnnotation
-from ..utils import read_pickle, check_file_existence
+from ..utils import read_pickle, check_file_existence, read_json
 
-from .format_converter import BaseFormatConverter, ConverterReturn
+from .format_converter import BaseFormatConverter, ConverterReturn, verify_label_map
+
+try:
+    from PIL import Image
+except ImportError:
+    Image = None
 
 CIFAR10_LABELS_LIST = [
     'airplane', 'automobile', 'bird', 'cat', 'deer',
     'dog', 'frog', 'horse', 'ship', 'truck'
 ]
 
+CIFAR100_LABELS_LIST = [
+    'beaver', 'dolphin', 'otter', 'seal', 'whale',
+    'aquarium fish', 'flatfish', 'ray', 'shark', 'trout',
+    'orchids', 'poppies', 'roses', 'sunflowers', 'tulips',
+    'bottles', 'bowls', 'cans', 'cups', 'plates',
+    'apples', 'mushrooms', 'oranges', 'pears', 'sweet peppers',
+    'clock', 'computer keyboard', 'lamp', 'telephone', 'television',
+    'bed', 'chair', 'couch', 'table', 'wardrobe',
+    'bee', 'beetle', 'butterfly', 'caterpillar', 'cockroach',
+    'bear', 'leopard', 'lion', 'tiger', 'wolf',
+    'bridge', 'castle', 'house', 'road', 'skyscraper',
+    'cloud', 'forest', 'mountain', 'plain', 'sea',
+    'camel', 'cattle', 'chimpanzee', 'elephant', 'kangaroo',
+    'fox', 'porcupine', 'possum', 'raccoon', 'skunk',
+    'crab', 'lobster', 'snail', 'spider', 'worm',
+    'baby', 'boy', 'girl', 'man', 'woman',
+    'crocodile', 'dinosaur', 'lizard', 'snake', 'turtle',
+    'hamster', 'mouse', 'rabbit', 'shrew', 'squirrel',
+    'maple', 'oak', 'palm', 'pine', 'willow',
+    'bicycle', 'bus', 'motorcycle', 'pickup truck', 'train',
+    'lawn-mower', 'rocket', 'streetcar', 'tank', 'tractor'
+]
+
+class_map = {
+    10: (CIFAR10_LABELS_LIST, 'labels'),
+    100: (CIFAR100_LABELS_LIST, 'fine_labels')
+}
 
-class Cifar10FormatConverter(BaseFormatConverter):
+
+class CifarFormatConverter(BaseFormatConverter):
     """
     cifar10 dataset converter. All annotation converters should be derived from BaseFormatConverter class.
     """
 
     # register name for this converter
     # this name will be used for converter class look up
-    __provider__ = 'cifar10'
+    __provider__ = 'cifar'
     annotation_types = (ClassificationAnnotation, )
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'data_batch_file': PathField(description="Path to pickle file which contain dataset batch."),
             'convert_images': BoolField(
                 optional=True,
@@ -55,11 +87,18 @@ def parameters(cls):
                 optional=True,
                 default=False,
                 description="Allows to add background label to original labels and convert dataset "
-                            "for 11 classes instead 10"
+            ),
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map, color_encoding', optional=True
+            ),
+            'num_classes': NumberField(
+                optional=True, default=10, value_type=int,
+                description='the number of classes in the dataset without background (10 or 100)'
+
             )
         })
 
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         """
@@ -68,10 +107,16 @@ def configure(self):
         """
         self.data_batch_file = self.get_value_from_config('data_batch_file')
         self.has_background = self.get_value_from_config('has_background')
+        self.num_classes = self.get_value_from_config('num_classes')
         self.converted_images_dir = self.get_value_from_config('converted_images_dir')
         if not self.converted_images_dir:
             self.converted_images_dir = self.data_batch_file.parent / 'converted_images'
         self.convert_images = self.get_value_from_config('convert_images')
+        if self.convert_images and Image is None:
+            raise ValueError(
+                "conversion cifar images extraction requires Pillow installation, please install it before usage"
+            )
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
 
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
         """
@@ -99,19 +144,23 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
         annotation = []
         # read original dataset annotation
         annotation_dict = read_pickle(self.data_batch_file, encoding='latin1')
-        labels = annotation_dict['labels']
+        # Originally dataset labels start from 0, some networks can be trained with usage 1 as label start.
+        labels_offset = 0 if not self.has_background else 1
+        # create metadata for dataset. Provided additional information is task specific and can include, for example
+        # label_map, information about background, used class color representation (for semantic segmentation task)
+        # If your dataset does not have additional meta, you may omit it.
+        meta, label_names, labels_id = self.generate_meta(labels_offset)
+        labels = annotation_dict[labels_id]
         images = annotation_dict['data']
         images = images.reshape(images.shape[0], 3, 32, 32).astype(np.uint8)
         image_file = '{}_{}.png'
-        # Originally dataset labels start from 0, some networks can be trained with usage 1 as label start.
-        labels_offset = 0 if not self.has_background else 1
         num_iterations = len(labels)
         # convert each annotation object to ClassificationAnnotation
         for data_id, (label, feature) in enumerate(zip(labels, images)):
             # generate id of image which will be used for evaluation (usually name of file is used)
             # file name represented as {id}_{class}.png, where id is index of image in dataset,
             # label is text description of dataset class e.g. 1_cat.png
-            identifier = image_file.format(data_id, CIFAR10_LABELS_LIST[label])
+            identifier = image_file.format(data_id, label_names[label] if label_names else label)
             # Create representation for image. Provided parameters can be differ depends on task.
             # ClassificationAnnotation contains image identifier and label for evaluation.
             annotation.append(ClassificationAnnotation(identifier, label + labels_offset))
@@ -129,17 +178,21 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
 
             if progress_callback is not None and data_id % progress_interval == 0:
                 progress_callback(data_id / num_iterations * 100)
-        # crete metadata for dataset. Provided additional information is task specific and can includes, for example
-        # label_map, information about background, used class color representation (for semantic segmentation task)
-        # If your dataset does not have additional meta, you can to not provide it.
-        meta = {
-            'label_map': {
-                label_id + labels_offset: label_name for label_id, label_name in enumerate(CIFAR10_LABELS_LIST)
-            }
-        }
 
+        return ConverterReturn(annotation, meta, content_errors)
+
+    def generate_meta(self, labels_offset):  # -> (meta dict, label names, key of labels in the batch file)
+        labels, labels_id = class_map.get(self.num_classes, ([], 'labels'))
+        meta = {}
+        if self.dataset_meta:
+            meta = read_json(self.dataset_meta)
+            if 'label_map' in meta:
+                meta['label_map'] = verify_label_map(meta['label_map'])
+                return meta, labels, labels_id  # convert() unpacks three values
+            labels = meta.get('labels', labels)
+        meta.update({'label_map': {label_id + labels_offset: label_name for label_id, label_name in enumerate(labels)}})
         if self.has_background:
             meta['label_map'][0] = 'background'
             meta['background_label'] = 0
 
-        return ConverterReturn(annotation, meta, content_errors)
+        return meta, labels, labels_id
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/cityscapes.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/cityscapes.py
index 34100018c02..71bc8c43a7e 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/cityscapes.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/cityscapes.py
@@ -18,8 +18,8 @@
 from ..representation import SegmentationAnnotation
 from ..representation.segmentation_representation import GTMaskLoader
 from ..config import PathField, StringField, BoolField
-from .format_converter import BaseFormatConverter, ConverterReturn
-from ..utils import check_file_existence
+from .format_converter import BaseFormatConverter, ConverterReturn, verify_label_map
+from ..utils import check_file_existence, read_json
 
 
 train_meta = {
@@ -66,8 +66,8 @@ class CityscapesConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'dataset_root_dir': PathField(is_directory=True, description="Path to dataset root."),
             'images_subfolder': StringField(
                 optional=True,
@@ -89,10 +89,13 @@ def parameters(cls):
                 optional=True,
                 default=False,
                 description="Allows to use full label map with 33 classes instead train label map with 18 classes."
+            ),
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map, color_encoding', optional=True
             )
         })
 
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         self.dataset_root = self.get_value_from_config('dataset_root_dir')
@@ -101,6 +104,7 @@ def configure(self):
         self.masks_suffix = self.get_value_from_config('masks_suffix')
         self.images_suffix = self.get_value_from_config('images_suffix')
         self.use_full_label_map = self.get_value_from_config('use_full_label_map')
+        self.dataset_meta_file = self.get_value_from_config('dataset_meta_file')
 
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
         images = list(self.dataset_root.rglob(r'{}/*/*{}.png'.format(self.images_dir, self.images_suffix)))
@@ -109,15 +113,24 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
         num_iterations = len(images)
         for idx, image in enumerate(images):
             identifier = str(Path(self.images_dir).joinpath(*image.parts[-2:]))
-            mask = Path(self.masks_dir) / image.parts[-2] / self.masks_suffix.join(
+            mask = str(Path(self.masks_dir) / image.parts[-2] / self.masks_suffix.join(
                 str(image.name).split(self.images_suffix)
-            )
+            ))
             if check_content:
                 if not check_file_existence(self.dataset_root / mask):
                     content_errors.append('{}: does not exist'.format(self.dataset_root / mask))
             annotations.append(SegmentationAnnotation(identifier, mask, mask_loader=GTMaskLoader.PILLOW))
             if progress_callback is not None and idx % progress_interval == 0:
                 progress_callback(idx / num_iterations * 100)
-        meta = full_dataset_meta if self.use_full_label_map else train_meta
 
-        return ConverterReturn(annotations, meta, content_errors)
+        return ConverterReturn(annotations, self.generate_meta(), content_errors)
+
+    def generate_meta(self):  # a user-supplied meta file overrides the built-in label maps
+        if self.dataset_meta_file is None:
+            return full_dataset_meta if self.use_full_label_map else train_meta
+        dataset_meta = read_json(self.dataset_meta_file)
+        if 'label_map' in dataset_meta:
+            dataset_meta['label_map'] = verify_label_map(dataset_meta['label_map'])
+        elif 'labels' in dataset_meta:
+            dataset_meta['label_map'] = dict(enumerate(dataset_meta['labels']))
+        return dataset_meta
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/cmu_panoptic.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/cmu_panoptic.py
new file mode 100644
index 00000000000..14ac8379896
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/cmu_panoptic.py
@@ -0,0 +1,131 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+from pathlib import Path
+
+import cv2
+import numpy as np
+
+from ..utils import read_json, check_file_existence
+from ..representation import PoseEstimation3dAnnotation
+from .format_converter import DirectoryBasedAnnotationConverter, ConverterReturn
+
+
+class CmuPanopticKeypointsConverter(DirectoryBasedAnnotationConverter):
+    __provider__ = 'cmu_panoptic_keypoints'
+    annotation_types = (PoseEstimation3dAnnotation,)
+
+    def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
+        images_dir_name = 'hdImgs'
+        labels_dir_name = 'hdPose3d_stage1_coco19'
+        label_prefix = 'body3DScene'
+        data, num_iterations = self._collect_data(self.data_dir, images_dir_name)
+
+        keypoints_annotations = []
+        content_errors = []
+        image_id = 0
+        for scene_dir, cameras_dir in data.items():
+            calibration_name = 'calibration_{}.json'.format(scene_dir.stem)
+            calibration = read_json(scene_dir / calibration_name)
+            for camera_dir, images_paths in cameras_dir.items():
+                camera_parameters = {}
+                for camera in calibration['cameras']:
+                    if camera['type'] != 'hd':
+                        continue
+                    if camera['name'] != camera_dir.stem:
+                        continue
+                    camera_parameters = {
+                        'K': np.array(camera['K'], dtype=np.float32),
+                        'distCoef': np.array(camera['distCoef'], dtype=np.float32),
+                        'R': np.array(camera['R'], dtype=np.float32),
+                        't': np.array(camera['t'], dtype=np.float32)}
+                    break
+
+                for image_path in images_paths:
+                    if check_content:
+                        if not check_file_existence(image_path):
+                            content_errors.append('{}: does not exist'.format(image_path))
+                    label_name = image_path.name.replace(camera_dir.stem, label_prefix)
+                    label_path = scene_dir / labels_dir_name / label_name.replace('jpg', 'json')
+                    label = read_json(label_path)
+
+                    annotations = []
+                    for body_id, body in enumerate(label['bodies']):
+                        # joints19 is a flat list: reshape to rows of 4 values, then transpose to 4 x N
+                        skel = np.array(body['joints19']).reshape((-1, 4)).transpose()
+                        annotations.append({'id': body_id, 'body': skel})
+
+                    keypoints_2d = CmuPanopticKeypointsConverter._project_3d_keypoints_to_frame(
+                        annotations, camera_parameters)
+                    keypoints_3d = CmuPanopticKeypointsConverter._to_camera_space(
+                        annotations, camera_parameters['R'], camera_parameters['t'])
+
+                    identifier = Path(*image_path.parts[-4:])
+                    keypoints_annotation = PoseEstimation3dAnnotation(
+                        identifier, keypoints_2d[:, 0].astype(np.float32), keypoints_2d[:, 1].astype(np.float32),
+                        np.full_like(keypoints_2d[:, 1].astype(np.float32), 1),
+                        x_3d_values=keypoints_3d[:, 0], y_3d_values=keypoints_3d[:, 1], z_3d_values=keypoints_3d[:, 2],
+                        fx=camera_parameters['K'][0, 0])
+                    keypoints_annotations.append(keypoints_annotation)
+                    if progress_callback is not None and image_id % progress_interval == 0:
+                        progress_callback(image_id / num_iterations * 100)
+                    image_id += 1
+
+        return ConverterReturn(keypoints_annotations, None, content_errors)
+
+    @staticmethod
+    def _project_3d_keypoints_to_frame(annotations, camera_parameters):
+        keypoints_2d = []
+        for annotation in annotations:
+            pt = cv2.projectPoints(annotation['body'][0:3, :].transpose().copy(),
+                                   cv2.Rodrigues(camera_parameters['R'])[0],
+                                   camera_parameters['t'],
+                                   camera_parameters['K'],
+                                   camera_parameters['distCoef'])
+            pt = np.squeeze(pt[0], axis=1).transpose()
+
+            keypoints_2d.append(pt)
+
+        return np.array(keypoints_2d)
+
+    @staticmethod
+    def _to_camera_space(annotations, R, t):
+        keypoints_3d = np.zeros((len(annotations),
+                                 annotations[0]['body'].shape[0],
+                                 annotations[0]['body'].shape[1]), dtype=np.float32)
+        for pose_id, annotation in enumerate(annotations):
+            keypoints_in_camera_space = annotation['body'].copy()  # do not modify the caller's array
+            keypoints_in_camera_space[:3, :] = np.dot(R, keypoints_in_camera_space[:3, :]) + t
+            keypoints_3d[pose_id] = keypoints_in_camera_space
+
+        return keypoints_3d
+
+    @staticmethod
+    def _collect_data(data_dir, images_dir_name):
+        data = {}
+        num_iterations = 0
+        for scene_dir in data_dir.iterdir():
+            if not scene_dir.is_dir():
+                continue
+            data[scene_dir] = {}
+            scene_images_dir = scene_dir / images_dir_name
+            for camera_dir in scene_images_dir.iterdir():
+                if not camera_dir.is_dir():
+                    continue
+                data[scene_dir][camera_dir] = list(camera_dir.rglob('*.jpg'))
+                num_iterations += len(data[scene_dir][camera_dir])
+
+        return data, num_iterations
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/common_semantic_segmentation.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/common_semantic_segmentation.py
index c853c22ac93..0e6d0627f47 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/common_semantic_segmentation.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/common_semantic_segmentation.py
@@ -1,6 +1,7 @@
 from pathlib import Path
 from ..config import PathField, StringField
-from .format_converter import BaseFormatConverter, ConverterReturn
+from ..logging import warning
+from .format_converter import BaseFormatConverter, ConverterReturn, verify_label_map
 from ..representation.segmentation_representation import LOADERS_MAPPING
 from ..representation import SegmentationAnnotation
 from ..utils import read_json
@@ -11,8 +12,8 @@ class CommonSegmentationConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update(
+        configuration_parameters = super().parameters()
+        configuration_parameters.update(
             {
                 'images_dir': PathField(description='path to input images directory', is_directory=True),
                 'masks_dir': PathField(description='path to gt masks directory', is_directory=True),
@@ -25,12 +26,12 @@ def parameters(cls):
                     description='reader for gt masks. Supported: {}'.format(', '.join(LOADERS_MAPPING)),
                     default='pillow'
                 ),
-                'dataset_meta': PathField(
+                'dataset_meta_file': PathField(
                     description='path to json file with dataset meta (e.g. label_map, color_encoding', optional=True
                 )
             }
         )
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         self.images_dir = self.get_value_from_config('images_dir')
@@ -40,7 +41,7 @@ def configure(self):
         self.mask_prefix = self.get_value_from_config('mask_prefix')
         self.mask_postfix = self.get_value_from_config('mask_postfix')
         self.mask_loader = LOADERS_MAPPING[self.get_value_from_config('mask_loader')]
-        self.dataset_meta = self.get_value_from_config('dataset_meta')
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
 
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
         annotations = []
@@ -72,6 +73,15 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
             if progress_callback is not None and idx % progress_interval == 0:
                 progress_callback(idx / num_iterations * 100)
 
-        dataset_meta = read_json(self.dataset_meta) if self.dataset_meta else None
+        dataset_meta = None
+        if self.dataset_meta:
+            dataset_meta = read_json(self.dataset_meta)
+            # prefer an explicit label_map; otherwise derive ids from the order of 'labels'
+            if 'label_map' in dataset_meta:
+                dataset_meta['label_map'] = verify_label_map(dataset_meta['label_map'])
+            elif 'labels' in dataset_meta:
+                dataset_meta['label_map'] = dict(enumerate(dataset_meta['labels']))
+            else:
+                warning("Information about dataset labels is not provided. Please provide it for metric calculation.")
 
         return ConverterReturn(annotations, dataset_meta, content_errors)
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/convert.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/convert.py
index 4c2fc2e40ab..4acb685ffa4 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/convert.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/convert.py
@@ -32,7 +32,7 @@
 
 def build_argparser():
     parser = ArgumentParser(
-        description="Converts annotation form a arbitrary format to accuracy-checker specific format", add_help=False
+        description="Converts annotation form an arbitrary format to accuracy-checker specific format", add_help=False
     )
     parser.add_argument(
         "converter",
@@ -74,7 +74,7 @@ def get_pairs(pairs_list):
 
         subsample_set = OrderedSet()
         potential_ann_ind = np.random.choice(len(annotation), size, replace=False)
-        for ann_ind in potential_ann_ind:
+        for ann_ind in potential_ann_ind: # pylint: disable=E1133
             annotation_for_subset = annotation[ann_ind]
             positive_pairs = annotation_for_subset.positive_pairs
             negative_pairs = annotation_for_subset.negative_pairs
@@ -147,10 +147,16 @@ def main():
 
 def save_annotation(annotation, meta, annotation_file, meta_file):
     if annotation_file:
+        annotation_dir = annotation_file.parent
+        if not annotation_dir.exists():
+            annotation_dir.mkdir(parents=True)
         with annotation_file.open('wb') as file:
             for representation in annotation:
                 representation.dump(file)
     if meta_file and meta:
+        meta_dir = meta_file.parent
+        if not meta_dir.exists():
+            meta_dir.mkdir(parents=True)
         with meta_file.open('wt') as file:
             json.dump(meta, file)
 
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_age_gender_recognition.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_age_gender_recognition.py
index ea2b487a625..926708a2b47 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_age_gender_recognition.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_age_gender_recognition.py
@@ -26,14 +26,14 @@ class CVATAgeGenderRecognitionConverter(FileBasedAnnotationConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'images_dir': PathField(
                 is_directory=True, optional=True,
                 description='path to dataset images, used only for content existence check'
             )
         })
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         super().configure()
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_attributes_recognition.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_attributes_recognition.py
index 7982ac263b8..4eec9d6c698 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_attributes_recognition.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_attributes_recognition.py
@@ -28,15 +28,15 @@ class CVATAttributesRecognitionConverter(FileBasedAnnotationConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'label': StringField(description='specific label for attribute collection'),
             'images_dir': PathField(
                 is_directory=True, optional=True,
                 description='path to dataset images, used only for content existence check'
             )
         })
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         super().configure()
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_facial_landmarks.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_facial_landmarks.py
index 319305017eb..ce2b8c0a20e 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_facial_landmarks.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_facial_landmarks.py
@@ -27,14 +27,14 @@ class CVATFacialLandmarksRecognitionConverter(FileBasedAnnotationConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'images_dir': PathField(
                 is_directory=True, optional=True,
                 description='path to dataset images, used only for content existence check'
             )
         })
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         super().configure()
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_human_pose.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_human_pose.py
index 012a6a2c11e..03b8a288c7d 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_human_pose.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_human_pose.py
@@ -47,14 +47,14 @@ class CVATPoseEstimationConverter(FileBasedAnnotationConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'images_dir': PathField(
                 is_directory=True, optional=True,
                 description='path to dataset images, used only for content existence check'
             )
         })
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         super().configure()
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_multilabel_recognition.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_multilabel_recognition.py
index 628fe9d4ed4..00cea2d0390 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_multilabel_recognition.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_multilabel_recognition.py
@@ -27,15 +27,15 @@ class CVATMultilabelAttributesRecognitionConverter(FileBasedAnnotationConverter)
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'label': StringField(description='specific label for attribute collection'),
             'images_dir': PathField(
                 is_directory=True, optional=True,
                 description='path to dataset images, used only for content existence check'
             )
         })
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         super().configure()
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_object_detection.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_object_detection.py
index 5df376d9b5d..d52acd475e3 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_object_detection.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_object_detection.py
@@ -28,39 +28,32 @@ class CVATObjectDetectionConverter(FileBasedAnnotationConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'images_dir': PathField(
                 is_directory=True, optional=True,
                 description='path to dataset images, used only for content existence check'
             ),
             'has_background': BoolField(optional=True, default=True, description='Dataset has background label or not'),
-            'labels_file': PathField(optional=True, description='path to label map in json format')
+            'labels_file': PathField(optional=True, description='path to label map in json format'),
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map, color_encoding)', optional=True
+            )
         })
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         super().configure()
         self.has_background = self.get_value_from_config('has_background')
         self.images_dir = self.get_value_from_config('images_dir') or self.annotation_file.parent
         self.label_map_file = self.get_value_from_config('labels_file')
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
 
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
         annotation = read_xml(self.annotation_file)
-        meta = annotation.find('meta')
-        size = int(meta.find('task').find('size').text)
-        if self.label_map_file:
-            label_to_id = read_json(self.label_map_file).get('labels')
-            if not label_to_id:
-                raise ConfigError('label_map_file does not contains labels key')
-        else:
-            labels = [label.find('name').text for label in meta.iter('label') if label.find('name').text]
-            if not labels:
-                raise ConfigError('annotation file does not contains labels')
-            if self.has_background:
-                labels = ['background'] + labels
-            label_to_id = {label: idx for idx, label in enumerate(labels)}
-
+        annotation_meta = annotation.find('meta')
+        size = int(annotation_meta.find('task').find('size').text)
+        label_to_id, meta = self.generate_labels_mapping(annotation_meta)
         annotations = []
         content_errors = None if not check_content else []
         for image_id, image in enumerate(annotation.iter('image')):
@@ -85,11 +78,39 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
             if progress_callback is not None and image_id % progress_interval == 0:
                 progress_callback(image_id * 100 / size)
 
-        return ConverterReturn(annotations, self.generate_meta(label_to_id), content_errors)
+        return ConverterReturn(annotations, meta, content_errors)
+
+    def generate_labels_mapping(self, annotation_meta):  # -> (label name to id dict, dataset meta dict)
+        if self.dataset_meta:
+            meta = read_json(self.dataset_meta)
+            if 'labels' in meta and 'label_map' not in meta:
+                offset = int(self.has_background)
+                label_to_id = {label_name: label_id + offset for label_id, label_name in enumerate(meta['labels'])}
+                meta['label_map'] = {value: key for key, value in label_to_id.items()}  # id -> name
+                if self.has_background:
+                    meta['label_map'][0] = 'background'
+                    meta['background_label'] = 0
 
-    def generate_meta(self, values_mapping):
-        meta = {'label_map': {value: key for key, value in values_mapping.items()}}
-        if self.has_background:
-            meta['background_label'] = 0
+            label_map = meta.get('label_map')
+            if not label_map:
+                raise ConfigError('dataset_meta_file should contains labels or label_map')
+            label_to_id = {value: key for key, value in label_map.items()}
+
+            return label_to_id, meta
+
+        meta = {}
+        if self.label_map_file:
+            label_to_id = read_json(self.label_map_file).get('labels')
+            if not label_to_id:
+                raise ConfigError('label_map_file does not contains labels key')
+        else:
+            labels = [label.find('name').text for label in annotation_meta.iter('label') if label.find('name').text]
+            if not labels:
+                raise ConfigError('annotation file does not contains labels')
+            if self.has_background:
+                labels = ['background'] + labels
+                meta['background_label'] = 0
+            label_to_id = {label: idx for idx, label in enumerate(labels)}
+        meta['label_map'] = {value: key for key, value in label_to_id.items()}
 
-        return meta
+        return label_to_id, meta
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_person_detection_action_recognition.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_person_detection_action_recognition.py
index 467f362f0c1..6c1a0025c45 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_person_detection_action_recognition.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_person_detection_action_recognition.py
@@ -100,8 +100,8 @@ class CVATPersonDetectionActionRecognitionConverter(FileBasedAnnotationConverter
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'images_dir': PathField(
                 is_directory=True, optional=True,
                 description='path to dataset images, used only for content existence check'
@@ -112,7 +112,7 @@ def parameters(cls):
                             "Supported range actions: {}".format(', '.join(ACTIONS.keys()))
             ),
         })
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         super().configure()
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_text_recognition.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_text_recognition.py
index aa078e9eb13..10ac39aea20 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_text_recognition.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/cvat_text_recognition.py
@@ -27,14 +27,14 @@ class CVATTextRecognitionConverter(FileBasedAnnotationConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'images_dir': PathField(
                 is_directory=True, optional=True,
                 description='path to dataset images, used only for content existence check'
             ),
         })
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         super().configure()
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/detection_opencv_storage.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/detection_opencv_storage.py
index b87ec9dbceb..49c90262c1e 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/detection_opencv_storage.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/detection_opencv_storage.py
@@ -14,11 +14,11 @@
 limitations under the License.
 """
 
-from ..config import PathField, NumberField
+from ..config import PathField, NumberField, ConfigError
 from ..representation import DetectionAnnotation
-from ..utils import convert_bboxes_xywh_to_x1y1x2y2, read_xml, read_txt, check_file_existence
+from ..utils import convert_bboxes_xywh_to_x1y1x2y2, read_xml, read_txt, check_file_existence, read_json
 
-from .format_converter import BaseFormatConverter, ConverterReturn
+from .format_converter import BaseFormatConverter, ConverterReturn, verify_label_map
 
 
 class DetectionOpenCVStorageFormatConverter(BaseFormatConverter):
@@ -27,8 +27,8 @@ class DetectionOpenCVStorageFormatConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'annotation_file': PathField(description="Path to annotation in xml format."),
             'image_names_file': PathField(
                 optional=True,
@@ -48,9 +48,13 @@ def parameters(cls):
             'data_dir': PathField(
                 is_directory=True, optional=True,
                 description='this parameter used only for dataset image existence validation purposes.'
+            ),
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map, color_encoding)', optional=True
             )
         })
-        return parameters
+
+        return configuration_parameters
 
     def configure(self):
         self.annotation_file = self.get_value_from_config('annotation_file')
@@ -60,6 +64,7 @@ def configure(self):
         self.data_dir = self.get_value_from_config('data_dir')
         if self.data_dir is None:
             self.data_dir = self.annotation_file.parent
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
 
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
         def update_progress(frame_id):
@@ -67,15 +72,9 @@ def update_progress(frame_id):
                 progress_callback(frame_id / num_iterations * 100)
 
         root = read_xml(self.annotation_file)
+        class_to_ind, meta = self.generate_meta(root)
 
-        labels_set = self.get_label_set(root)
-
-        labels_set = sorted(labels_set)
-        class_to_ind = dict(zip(labels_set, list(range(self.label_start, len(labels_set) + self.label_start + 1))))
-        label_map = {}
         content_check_errors = None
-        for class_label, ind in class_to_ind.items():
-            label_map[ind] = class_label
 
         annotations = []
         for frames in root:
@@ -119,12 +118,6 @@ def update_progress(frame_id):
                 if not check_file_existence(self.data_dir / annotation.identifier):
                     content_check_errors.append('{}: file not found'.format(self.data_dir / annotation.identifier))
 
-        meta = {}
-        if self.background_label:
-            label_map[self.background_label] = '__background__'
-            meta['background_label'] = self.background_label
-        meta['label_map'] = label_map
-
         return ConverterReturn(annotations, meta, content_check_errors)
 
     @staticmethod
@@ -134,7 +127,6 @@ def rename_identifiers(annotation_list, images_file):
 
         return annotation_list
 
-
     @staticmethod
     def get_label_set(xml_root):
         labels_set = set()
@@ -148,3 +140,37 @@ def get_label_set(xml_root):
                     labels_set.add(label)
 
         return labels_set
+
+    def generate_meta(self, root):
+        """Return (class_to_ind, meta) from dataset_meta_file if configured, else from labels found in root."""
+        if self.dataset_meta:
+            meta = read_json(self.dataset_meta)
+            # a plain `labels` list is expanded into label_map, numbered from label_start
+            if 'labels' in meta and 'label_map' not in meta:
+                class_to_ind = {label: idx for idx, label in enumerate(meta['labels'], self.label_start)}
+                # label_map must be a flat {id: name} dict, otherwise verify_label_map below rejects it
+                meta['label_map'] = {idx: label for label, idx in class_to_ind.items()}
+                if self.background_label:
+                    meta['label_map'][self.background_label] = '__background__'
+                    # report the id the background entry was actually stored under
+                    meta['background_label'] = self.background_label
+            label_map = meta.get('label_map')
+            if not label_map:
+                raise ConfigError('dataset_meta_file should contains labels or label_map')
+            # json object keys are strings: keep the int-keyed map in meta as well
+            label_map = meta['label_map'] = verify_label_map(label_map)
+            class_to_ind = {value: key for key, value in label_map.items()}
+
+            return class_to_ind, meta
+
+        # no meta file: number the sorted labels found in the annotation starting from label_start
+        labels_set = sorted(self.get_label_set(root))
+        class_to_ind = {label: idx for idx, label in enumerate(labels_set, self.label_start)}
+        label_map = {idx: label for label, idx in class_to_ind.items()}
+        meta = {}
+        if self.background_label:  # NOTE: a background id of 0 is falsy and therefore not registered
+            label_map[self.background_label] = '__background__'
+            meta['background_label'] = self.background_label
+        meta['label_map'] = label_map
+
+        return class_to_ind, meta
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/fashion_mnist.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/fashion_mnist.py
new file mode 100644
index 00000000000..2151e590e65
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/fashion_mnist.py
@@ -0,0 +1,139 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import gzip
+import numpy as np
+from ..config import PathField, BoolField
+from ..representation import ClassificationAnnotation
+from ..utils import check_file_existence, read_json
+
+from .format_converter import BaseFormatConverter, ConverterReturn
+
+try:
+    from PIL import Image
+except ImportError:
+    Image = None
+
+
+class FashionMnistConverter(BaseFormatConverter):
+    """
+    Fashion MNist dataset converter. All annotation converters should be derived from BaseFormatConverter class.
+    """
+
+    # register name for this converter
+    # this name will be used for converter class look up
+    __provider__ = 'fashion_mnist'
+    annotation_types = (ClassificationAnnotation, )
+
+    @classmethod
+    def parameters(cls):
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
+            'annotation_file': PathField(description="Path to annotation in binary format."),
+            'data_file': PathField(description="Path to data in binary format."),
+            'convert_images': BoolField(
+                optional=True,
+                default=False,
+                description="Allows to convert images to user specified directory."
+            ),
+            'converted_images_dir': PathField(
+                optional=True, is_directory=True, check_exists=False, description="Path to converted images location."
+            ),
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map, color_encoding)', optional=True
+            )
+        })
+
+        return configuration_parameters
+
+    def configure(self):
+        """
+        This method is responsible for obtaining the necessary parameters
+        for converting from the command line or config.
+        """
+        self.test_anno_file = self.get_value_from_config('annotation_file')
+        self.test_data_file = self.get_value_from_config('data_file')
+        self.converted_images_dir = self.get_value_from_config('converted_images_dir')
+        self.convert_images = self.get_value_from_config('convert_images')
+        if self.convert_images:
+            if not self.converted_images_dir:
+                self.converted_images_dir = self.test_anno_file.parent / 'converted_images'
+            self.converted_images_dir.mkdir(parents=True, exist_ok=True)  # also creates a user-supplied directory
+        if self.convert_images and Image is None:
+            raise ValueError(
+                "conversion fashion mnist images requires Pillow installation, please install it before usage"
+            )
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
+
+    def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
+        """
+        This method is executed automatically when convert.py is started.
+        All arguments are automatically got from command line arguments or config file in method configure
+
+        Returns:
+            annotations: list of annotation representation objects.
+            meta: dictionary with additional dataset level metadata.
+        """
+        annotations = []
+        check_images = check_content and not self.convert_images
+        meta = self.generate_meta()
+        content_errors = [] if check_content else None  # must be a list before the per-image append below
+        if check_content:
+            self.converted_images_dir = self.converted_images_dir or self.test_anno_file.parent / 'converted_images'
+
+        if self.converted_images_dir and check_content:
+            if not self.converted_images_dir.exists():
+                content_errors = ['{}: does not exist'.format(self.converted_images_dir)]
+                check_images = False
+        # read original dataset annotation
+
+        with gzip.open(str(self.test_anno_file), 'rb') as lbpath:
+            labels = np.frombuffer(lbpath.read(), dtype=np.uint8, offset=8)
+
+        with gzip.open(str(self.test_data_file), 'rb') as imgpath:
+            images = np.frombuffer(imgpath.read(), dtype=np.uint8, offset=16).reshape(len(labels), 784)
+
+        num_iterations = len(labels)
+        for index, annotation in enumerate(labels):
+            identifier = '{}.png'.format(index)
+            label = int(annotation)
+            if self.convert_images:
+                image = Image.fromarray(images[index].reshape(28, 28))
+                image = image.convert("L")
+                image.save(str(self.converted_images_dir / identifier))
+            annotations.append(ClassificationAnnotation(identifier, label))
+            if check_images:
+                if not check_file_existence(self.converted_images_dir / identifier):
+                    # add error to errors list if file not found
+                    content_errors.append('{}: does not exist'.format(self.converted_images_dir / identifier))
+
+            if progress_callback is not None and index % progress_interval == 0:
+                progress_callback(index / num_iterations * 100)
+
+        return ConverterReturn(annotations, meta, content_errors)
+
+    def generate_meta(self):
+        default_labels = ['T-shirt/top', 'Trouser', 'Pullover', 'Dress', 'Coat', 'Sandal', 'Shirt', 'Sneaker',
+                          'Bag', 'Ankle boot']
+        if not self.dataset_meta:
+            return {'label_map': dict(enumerate(default_labels))}
+        dataset_meta = read_json(self.dataset_meta)
+        label_map = dataset_meta.get('label_map')
+        if 'labels' in dataset_meta:
+            label_map = dict(enumerate(dataset_meta['labels']))
+        dataset_meta['label_map'] = label_map or dict(enumerate(default_labels))
+
+        return dataset_meta
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/format_converter.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/format_converter.py
index 2679a3e6a39..464c9b203f6 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/format_converter.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/format_converter.py
@@ -18,7 +18,7 @@
 from collections import namedtuple
 
 from ..topology_types import GenericTopology
-from ..config import ConfigValidator, StringField, PathField
+from ..config import ConfigValidator, StringField, PathField, ConfigError
 from ..dependency import ClassProvider
 from ..utils import format_key, get_parameter_value_from_config
 
@@ -124,3 +124,16 @@ def configure(self):
 
     def convert(self, check_content=False, **kwargs):
         pass
+
+
+def verify_label_map(label_map):
+    """Return a copy of label_map with every key converted to int; raise ConfigError on a non-integer key."""
+    checked = {}
+    for raw_id, name in label_map.items():
+        try:
+            checked[int(raw_id)] = name
+        except ValueError:
+            raise ConfigError(
+                'class_id {} is invalid. `label_map` should have integer keys.'.format(raw_id)
+            )
+    return checked
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/icdar.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/icdar.py
index fa3eb4dfd47..557a02883f5 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/icdar.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/icdar.py
@@ -18,12 +18,59 @@
 from ..representation import TextDetectionAnnotation, CharacterRecognitionAnnotation
 from ..utils import read_txt, check_file_existence
 from .format_converter import FileBasedAnnotationConverter, DirectoryBasedAnnotationConverter, ConverterReturn
-from ..config import PathField
+from ..config import PathField, BoolField
 
 
 def box_to_points(box):
     return np.array([[box[0][0], box[0][1]], [box[1][0], box[0][1]], [box[1][0], box[1][1]], [box[0][0], box[1][1]]])
 
+def strip(text):
+    """Cut a trailing 's (any case) and edge hyphens, turn punctuation into spaces, trim outer whitespace."""
+    punctuation = "'!?.:,*\"()\N{MIDDLE DOT}[]/"
+    if text.lower().endswith("'s"):
+        text = text[:-2]
+    to_space = str.maketrans(dict.fromkeys(punctuation, ' '))
+    cleaned = text.strip('-').translate(to_space)
+
+    return cleaned.strip()
+
+def is_word(text):
+    """
+    Tell whether text, after strip(), is a single token of at least 3 accepted characters.
+
+    Accepted characters are the hyphen and the ASCII, Latin and Greek code point ranges listed below.
+    """
+    text = strip(text)
+
+    if ' ' in text or len(text) < 3:
+        return False
+
+    forbidden_symbols = "\N{MULTIPLICATION SIGN}\N{DIVISION SIGN}\N{GREEK ANO TELEIA}"
+
+    # inclusive (first, last) code point bounds of accepted characters
+    allowed_ranges = (
+        (ord(u'a'), ord(u'z')),
+        (ord(u'A'), ord(u'Z')),
+        (ord(u'\N{LATIN CAPITAL LETTER A WITH GRAVE}'),
+         ord(u'\N{LATIN LETTER WYNN}')),
+        (ord(u'\N{LATIN CAPITAL LETTER DZ WITH CARON}'),
+         ord(u'\N{LATIN SMALL LETTER REVERSED R WITH FISHHOOK}')),
+        (ord(u'\N{GREEK CAPITAL LETTER ALPHA WITH TONOS}'),
+         ord(u'\N{GREEK CAPITAL REVERSED DOTTED LUNATE SIGMA SYMBOL}')),
+        (ord(u'-'), ord(u'-')),
+    )
+
+    # every character must be inside an accepted range and not explicitly forbidden
+    for char in text:
+        if char in forbidden_symbols:
+            return False
+
+        char_code = ord(char)
+        if not any(first <= char_code <= last for first, last in allowed_ranges):
+            return False
+
+    return True
+
 
 class ICDAR15DetectionDatasetConverter(DirectoryBasedAnnotationConverter):
     __provider__ = 'icdar_detection'
@@ -31,20 +78,26 @@ class ICDAR15DetectionDatasetConverter(DirectoryBasedAnnotationConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update(
+        configuration_parameters = super().parameters()
+        configuration_parameters.update(
             {
                 'images_dir': PathField(
                     is_directory=True, optional=True,
                     description='path to dataset images, used only for content existence check'
+                ),
+                'word_spotting': BoolField(
+                    optional=True, default=False,
+                    description='transcriptions that have lengths less than 3 symbols or '
+                                'transcriptions containing non-alphanumeric symbols will be marked as difficult'
                 )
             }
         )
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         super().configure()
         self.images_dir = self.get_value_from_config('images_dir')
+        self.word_spotting = self.get_value_from_config('word_spotting')
 
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
         annotations = []
@@ -72,6 +125,11 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
                     points = box_to_points(points)
                 if transcription == '###':
                     difficult.append(len(transcriptions))
+                elif self.word_spotting:
+                    if not is_word(transcription):
+                        difficult.append(len(transcriptions))
+                    else:
+                        transcription = strip(transcription)
                 all_points.append(points)
                 transcriptions.append(transcription)
             annotation = TextDetectionAnnotation(identifier, all_points, transcriptions)
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/imagenet.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/imagenet.py
index 51ec4e4af0b..e318a665174 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/imagenet.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/imagenet.py
@@ -18,10 +18,10 @@
 
 from ..config import PathField, BoolField
 from ..representation import ClassificationAnnotation
-from ..utils import read_txt, get_path, check_file_existence
+from ..utils import read_txt, get_path, check_file_existence, read_json
 
 from ..topology_types import ImageClassification
-from .format_converter import BaseFormatConverter, ConverterReturn
+from .format_converter import BaseFormatConverter, ConverterReturn, verify_label_map
 
 
 class ImageNetFormatConverter(BaseFormatConverter):
@@ -31,8 +31,8 @@ class ImageNetFormatConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'annotation_file': PathField(description="Path to annotation in txt format."),
             'labels_file': PathField(
                 optional=True,
@@ -46,15 +46,19 @@ def parameters(cls):
             'images_dir': PathField(
                 is_directory=True, optional=True,
                 description='path to dataset images, used only for content existence check'
+            ),
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map, color_encoding)', optional=True
             )
         })
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         self.annotation_file = self.get_value_from_config('annotation_file')
         self.labels_file = self.get_value_from_config('labels_file')
         self.has_background = self.get_value_from_config('has_background')
         self.images_dir = self.get_value_from_config('images_dir') or self.annotation_file.parent
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
 
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
         annotation = []
@@ -72,24 +76,37 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
             if progress_callback is not None and image_id % progress_interval == 0:
                 progress_callback(image_id / num_iterations * 100)
 
-        meta = self._create_meta(self.labels_file, self.has_background) if self.labels_file else None
+        meta = self._create_meta(self.labels_file, self.dataset_meta, self.has_background) or None
 
         return ConverterReturn(annotation, meta, content_errors)
 
     @staticmethod
-    def _create_meta(labels_file, has_background=False):
+    def _create_meta(labels_file, dataset_meta, has_background=False):
         meta = {}
-        labels = {}
-        for i, line in enumerate(read_txt(get_path(labels_file))):
-            index_for_label = i if not has_background else i + 1
-            line = line.strip()
-            label = line[line.find(' ') + 1:]
-            labels[index_for_label] = label
+        label_map = {}
+        if dataset_meta:
+            meta = read_json(dataset_meta)
+            if 'labels' in meta and 'label_map' not in meta:  # test the loaded json, not the file path
+                labels = ['background'] + meta['labels'] if has_background else meta['labels']
+                label_map = dict(enumerate(labels))
+                meta['label_map'] = label_map
+            else:
+                if 'label_map' in meta:
+                    meta['label_map'] = verify_label_map(meta['label_map'])
+                return meta
+
+        if labels_file:
+            label_map = {}
+            for i, line in enumerate(read_txt(get_path(labels_file))):
+                index_for_label = i if not has_background else i + 1
+                line = line.strip()
+                label = line[line.find(' ') + 1:]
+                label_map[index_for_label] = label
+
+            meta['label_map'] = label_map
 
         if has_background:
-            labels[0] = 'background'
-            meta['backgound_label'] = 0
-
-        meta['label_map'] = labels
+            label_map[0] = 'background'
+            meta['background_label'] = 0
 
         return meta
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/lfw.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/lfw.py
index 1c8caf3c051..455fd9c3b28 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/lfw.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/lfw.py
@@ -30,8 +30,8 @@ class LFWConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'pairs_file': PathField(description="Path to file with annotation positive and negative pairs."),
             'landmarks_file': PathField(
                 optional=True, description="Path to file with facial landmarks coordinates for annotation images."
@@ -42,7 +42,7 @@ def parameters(cls):
             )
         })
 
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         self.pairs_file = self.get_value_from_config('pairs_file')
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/lpr.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/lpr.py
index 13f581e345a..7295b207917 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/lpr.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/lpr.py
@@ -26,8 +26,8 @@ class LPRConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'annotation_file': PathField(description="Path to annotation (.txt)."),
             'decoding_dictionary_file': PathField(
                 optional=True, description="Path to file containing dictionary for output decoding."
@@ -38,7 +38,7 @@ def parameters(cls):
             )
         })
 
-        return parameters
+        return configuration_parameters
 
     def configure(self, *args, **kwargs):
         self.annotation_file = self.get_value_from_config('annotation_file')
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/mnist.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/mnist.py
index e1a6f73206c..6b2847d0ef2 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/mnist.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/mnist.py
@@ -14,14 +14,18 @@
 limitations under the License.
 """
 
-from PIL import Image
 import numpy as np
 from ..config import PathField, BoolField
 from ..representation import ClassificationAnnotation
-from ..utils import read_csv, check_file_existence
+from ..utils import read_csv, check_file_existence, read_json
 
 from .format_converter import BaseFormatConverter, ConverterReturn
 
+try:
+    from PIL import Image
+except ImportError:
+    Image = None
+
 
 class MNISTCSVFormatConverter(BaseFormatConverter):
     """
@@ -35,8 +39,8 @@ class MNISTCSVFormatConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'annotation_file': PathField(description="Path to csv file which contain dataset."),
             'convert_images': BoolField(
                 optional=True,
@@ -46,9 +50,12 @@ def parameters(cls):
             'converted_images_dir': PathField(
                 optional=True, is_directory=True, check_exists=False, description="Path to converted images location."
             ),
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map, color_encoding)', optional=True
+            )
         })
 
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         """
@@ -63,6 +70,12 @@ def configure(self):
             if not self.converted_images_dir.exists():
                 self.converted_images_dir.mkdir(parents=True)
 
+        if self.convert_images and Image is None:
+            raise ValueError(
+                "conversion mnist images requires Pillow installation, please install it before usage"
+            )
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
+
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
         """
         This method is executed automatically when convert.py is started.
@@ -74,6 +87,8 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
         """
         annotations = []
         check_images = check_content and not self.convert_images
+        meta = self.generate_meta()
+        labels_to_id = meta['label_map']
         content_errors = None
         if check_content:
             self.converted_images_dir = self.converted_images_dir or self.test_csv_file.parent / 'converted_images'
@@ -87,7 +102,7 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
         num_iterations = len(annotation_table)
         for index, annotation in enumerate(annotation_table):
             identifier = '{}.png'.format(index)
-            label = int(annotation['label'])
+            label = labels_to_id.get(annotation['label'], int(annotation['label']))
             if self.convert_images:
                 image = Image.fromarray(self.convert_image(annotation))
                 image = image.convert("L")
@@ -101,9 +116,7 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
             if progress_callback is not None and index % progress_interval == 0:
                 progress_callback(index / num_iterations * 100)
 
-        meta = {'label_map': {str(i): i for i in range(10)}}
-
-        return ConverterReturn(annotations, meta, None)
+        return ConverterReturn(annotations, meta, content_errors)
 
     @staticmethod
     def convert_image(features):
@@ -115,3 +128,14 @@ def convert_image(features):
                 image[x, y] = pixel
 
         return image
+
+    def generate_meta(self):
+        """Build dataset meta; `labels` from the meta file take precedence over its `label_map`."""
+        digits_map = {str(i): i for i in range(10)}
+        if not self.dataset_meta:
+            return {'label_map': digits_map}
+        meta = read_json(self.dataset_meta)
+        label_map = dict(enumerate(meta['labels'])) if 'labels' in meta else meta.get('label_map')
+        meta['label_map'] = label_map or digits_map
+
+        return meta
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/ms_asl_continuous.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/ms_asl_continuous.py
new file mode 100644
index 00000000000..4595702298e
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/ms_asl_continuous.py
@@ -0,0 +1,155 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+from ..utils import read_txt, check_file_existence
+from ..representation import ClassificationAnnotation
+from ..data_readers import ClipIdentifier
+from ..config import PathField, NumberField
+
+from .format_converter import BaseFormatConverter, ConverterReturn
+
+
+class RawFramesSegmentedRecord:
+    """Read-only view of one annotation row: path, label, clip/video frame bounds and fps."""
+    def __init__(self, row):
+        self._data = row
+        assert self.video_num_frames > 0 and self.num_frames > 0
+        assert self.fps > 0 and self.label >= 0
+        assert self.clip_start >= self.video_start >= 0 and self.video_end >= self.clip_end >= 0
+
+    def _int(self, column):
+        return int(self._data[column])
+
+    @property
+    def path(self):
+        return self._data[0]
+
+    @property
+    def label(self):
+        return self._int(1)
+
+    @property
+    def clip_start(self):
+        return self._int(2)
+
+    @property
+    def clip_end(self):
+        return self._int(3)
+
+    @property
+    def video_start(self):
+        return self._int(4)
+
+    @property
+    def video_end(self):
+        return self._int(5)
+
+    @property
+    def fps(self):
+        return float(self._data[6])
+
+    @property
+    def num_frames(self):
+        return self.clip_end - self.clip_start
+
+    @property
+    def video_num_frames(self):
+        return self.video_end - self.video_start
+
+
+class MSASLContiniousConverter(BaseFormatConverter):
+    """Turn every record of the annotation file into one fixed-length clip annotation."""
+    __provider__ = 'continuous_clip_action_recognition'
+    annotation_types = (ClassificationAnnotation, )
+
+    @classmethod
+    def parameters(cls):
+        params = super().parameters()
+        params.update({
+            'annotation_file': PathField(description="Path to annotation file."),
+            'data_dir': PathField(is_directory=True, description="Path to data directory."),
+            'out_fps': NumberField(
+                value_type=float, optional=True, min_value=1, default=15, description="Output FPS."
+            ),
+            'clip_length': NumberField(
+                value_type=int, optional=True, min_value=1, default=16, description="Clip length."
+            )
+        })
+
+        return params
+
+    def configure(self):
+        self.annotation_file = self.get_value_from_config('annotation_file')
+        self.data_dir = self.get_value_from_config('data_dir')
+        self.out_fps = self.get_value_from_config('out_fps')
+        self.clip_length = self.get_value_from_config('clip_length')
+
+    def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
+        records = self.load_annotations(self.annotation_file)
+
+        annotations = []
+        num_iterations = len(records)
+        content_errors = None if not check_content else []
+        for record_idx, record in enumerate(records):
+            if progress_callback is not None and record_idx % progress_interval == 0:
+                progress_callback(record_idx * 100 / num_iterations)
+
+            frame_indices = self.get_indices(record, self.out_fps, self.clip_length)
+            frames = ['img_{:05d}.jpg'.format(idx) for idx in frame_indices]
+            identifier = ClipIdentifier(record.path, record_idx, frames)
+
+            if check_content:
+                content_errors.extend([
+                    '{}: does not exist'.format(self.data_dir / frame)
+                    for frame in frames if not check_file_existence(self.data_dir / frame)
+                ])
+
+            annotations.append(ClassificationAnnotation(identifier, record.label))
+
+        return ConverterReturn(annotations, dict(), content_errors)
+
+    @staticmethod
+    def load_annotations(ann_file):
+        return [RawFramesSegmentedRecord(x.strip().split(' ')) for x in read_txt(ann_file)]
+
+    @staticmethod
+    def get_indices(record, output_fps, out_clip_size):
+        """Pick `out_clip_size` frame indices, stepping by round(record.fps / output_fps), at least 1."""
+        time_step = max(1, int(round(float(record.fps) / float(output_fps))))
+
+        input_length, output_length = time_step * out_clip_size, out_clip_size
+
+        if record.video_num_frames < input_length:
+            # keep at least one frame: a video shorter than `time_step` would otherwise give an
+            # empty list and the padding below would fail on `indices[0]`
+            indices = [i * time_step + 1 for i in range(max(1, record.video_num_frames // time_step))]
+            num_rest = output_length - len(indices)
+            if num_rest > 0:
+                num_before = num_rest // 2
+                num_after = num_rest - num_before
+                indices = [indices[0]] * num_before + indices + [indices[-1]] * num_after
+        else:
+            if record.num_frames < input_length:
+                shift_end = min(record.video_end - input_length + 1, record.clip_start + 1)
+                start_pos = shift_end - 1
+            else:
+                shift_start = record.clip_start
+                shift_end = record.clip_end - input_length + 1
+                start_pos = (shift_start + shift_end) // 2
+
+            indices = [start_pos + i * time_step + 1 for i in range(output_length)]
+
+        return indices
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/ms_coco.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/ms_coco.py
index 5c6fccabab6..615e654b1fc 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/ms_coco.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/ms_coco.py
@@ -14,22 +14,40 @@
 limitations under the License.
 """
 
-from tqdm import tqdm
 import numpy as np
 
 from ..config import BoolField, PathField
+from ..logging import print_info
 from ..utils import read_json, convert_bboxes_xywh_to_x1y1x2y2, check_file_existence
 from ..representation import (
     DetectionAnnotation, PoseEstimationAnnotation, CoCoInstanceSegmentationAnnotation, ContainerAnnotation
 )
-from .format_converter import BaseFormatConverter, FileBasedAnnotationConverter, ConverterReturn
+from .format_converter import BaseFormatConverter, FileBasedAnnotationConverter, ConverterReturn, verify_label_map
+
+try:
+    from tqdm import tqdm
+except ImportError:
+    tqdm = None
 
 
 def get_image_annotation(image_id, annotations_):
     return list(filter(lambda x: x['image_id'] == image_id, annotations_))
 
 
-def get_label_map(full_annotation, use_full_label_map=False, has_background=False):
+def get_label_map(dataset_meta, full_annotation, use_full_label_map=False, has_background=False):
+    if dataset_meta:
+        meta = read_json(dataset_meta)
+        label_map = meta.get('label_map')
+        if not label_map:
+            labels = meta.get('labels')
+            label_offset = int(has_background)
+            if labels:
+                label_map = {i + label_offset: label for i, label in enumerate(labels)}
+        if label_map:
+            label_map = verify_label_map(label_map)
+            label_id_to_label = {i: i for i in label_map}
+            return label_map, label_id_to_label
+
     labels = full_annotation['categories']
 
     if not use_full_label_map:
@@ -49,8 +67,8 @@ class MSCocoDetectionConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'annotation_file': PathField(description="Path to annotation file in json format."),
             'use_full_label_map': BoolField(
                 optional=True, default=False,
@@ -66,9 +84,12 @@ def parameters(cls):
             'images_dir': PathField(
                 is_directory=True, optional=True,
                 description='path to dataset images, used only for content existence check'
+            ),
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map, color_encoding)', optional=True
             )
         })
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         self.annotation_file = self.get_value_from_config('annotation_file')
@@ -76,6 +97,7 @@ def configure(self):
         self.use_full_label_map = self.get_value_from_config('use_full_label_map')
         self.sort_annotations = self.get_value_from_config('sort_annotations')
         self.images_dir = self.get_value_from_config('images_dir') or self.annotation_file.parent
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
 
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
         full_annotation = read_json(self.annotation_file)
@@ -85,7 +107,9 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
             image_ids.sort(key=lambda value: value[0])
         annotations = full_annotation['annotations']
 
-        label_map, label_id_to_label = get_label_map(full_annotation, self.use_full_label_map, self.has_background)
+        label_map, label_id_to_label = get_label_map(
+            self.dataset_meta, full_annotation, self.use_full_label_map, self.has_background
+        )
 
         meta = {}
         if self.has_background:
@@ -105,8 +129,9 @@ def _create_representations(
         detection_annotations = []
         content_errors = [] if check_content else None
         num_iterations = len(image_info)
+        image_iter = tqdm(enumerate(image_info)) if tqdm is not None else enumerate(image_info)
 
-        for (image_id, image) in tqdm(enumerate(image_info)):
+        for (image_id, image) in image_iter:
             image_labels, xmins, ymins, xmaxs, ymaxs, is_crowd, _ = self._read_image_annotation(
                 image, annotations,
                 label_id_to_label
@@ -118,6 +143,8 @@ def _create_representations(
             detection_annotation = DetectionAnnotation(image[1], image_labels, xmins, ymins, xmaxs, ymaxs)
             detection_annotation.metadata['iscrowd'] = is_crowd
             detection_annotations.append(detection_annotation)
+            if tqdm is None and image_id % progress_interval == 0:
+                print_info('{} / {} processed'.format(image_id, num_iterations))
             if progress_callback is not None and image_id % progress_interval == 0:
                 progress_callback(image_id / num_iterations * 100)
 
@@ -150,6 +177,9 @@ def parameters(cls):
                 'images_dir': PathField(
                     is_directory=True, optional=True,
                     description='path to dataset images, used only for content existence check'
+                ),
+                'dataset_meta_file': PathField(
+                    description='path to json file with dataset meta (e.g. label_map, color_encoding)', optional=True
                 )
             }
         )
@@ -158,6 +188,7 @@ def parameters(cls):
     def configure(self):
         super().configure()
         self.images_dir = self.get_value_from_config('images_dir') or self.annotation_file.parent
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
 
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
         keypoints_annotations = []
@@ -166,7 +197,7 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
         full_annotation = read_json(self.annotation_file)
         image_info = full_annotation['images']
         annotations = full_annotation['annotations']
-        label_map, _ = get_label_map(full_annotation, True)
+        label_map, _ = get_label_map(self.dataset_meta, full_annotation, True)
         num_iterations = len(image_info)
         for image_id, image in enumerate(image_info):
             identifier = image['file_name']
@@ -214,8 +245,9 @@ def _create_representations(
         segmentation_annotations = []
         content_errors = None if not check_content else []
         num_iterations = len(image_info)
+        image_iter = tqdm(enumerate(image_info)) if tqdm is not None else enumerate(image_info)
 
-        for (image_id, image) in tqdm(enumerate(image_info)):
+        for (image_id, image) in image_iter:
             image_labels, _, _, _, _, is_crowd, segmentations = self._read_image_annotation(
                 image, annotations,
                 label_id_to_label
@@ -227,6 +259,9 @@ def _create_representations(
                     content_errors.append('{}: does not exist'.format(image_full_path))
             annotation.metadata['iscrowd'] = is_crowd
             segmentation_annotations.append(annotation)
+            if tqdm is None and image_id % progress_interval == 0:
+                print_info('{} / {} processed'.format(image_id, num_iterations))
+
             if progress_callback is not None and image_id % progress_interval == 0:
                 progress_callback(image_id / num_iterations * 100)
 
@@ -243,8 +278,9 @@ def _create_representations(
         container_annotations = []
         content_errors = None if not check_content else []
         num_iterations = len(image_info)
+        image_iter = tqdm(enumerate(image_info)) if tqdm is not None else enumerate(image_info)
 
-        for (image_id, image) in tqdm(enumerate(image_info)):
+        for (image_id, image) in image_iter:
             image_labels, xmins, ymins, xmaxs, ymaxs, is_crowd, segmentations = self._read_image_annotation(
                 image, annotations,
                 label_id_to_label
@@ -263,7 +299,75 @@ def _create_representations(
                 'segmentation_annotation': segmentation_annotation
             }))
 
+            if tqdm is None and image_id % progress_interval == 0:
+                print_info('{} / {} processed'.format(image_id, num_iterations))
+
             if progress_callback is not None and image_id % progress_interval == 0:
                 progress_callback(image_id / num_iterations * 100)
 
         return container_annotations, content_errors
+
+
+class MSCocoSingleKeypointsConverter(FileBasedAnnotationConverter):
+    """Emit one PoseEstimationAnnotation for every annotation entry that has keypoints."""
+    __provider__ = 'mscoco_single_keypoints'
+    annotation_types = (PoseEstimationAnnotation, )
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update(
+            {
+                'images_dir': PathField(
+                    is_directory=True, optional=True,
+                    description='path to dataset images, used only for content existence check'
+                )
+            }
+        )
+        return parameters
+
+    def configure(self):
+        super().configure()
+        self.images_dir = self.get_value_from_config('images_dir') or self.annotation_file.parent
+
+    def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
+        """
+        Read the annotation file and wrap each target with keypoints into its own annotation.
+
+        `progress_callback`, when given, receives the percentage of processed images.
+        """
+        keypoints_annotations = []
+        content_errors = []
+
+        full_annotation = read_json(self.annotation_file)
+        image_info = full_annotation['images']
+        annotations = full_annotation['annotations']
+        num_iterations = len(image_info)
+        for image_id, image in enumerate(image_info):
+            # report once per image and before any skip below; the interval test needs modulo,
+            # because bitwise AND on the index would fire on unrelated images
+            if progress_callback is not None and image_id % progress_interval == 0:
+                progress_callback(image_id / num_iterations * 100)
+
+            identifier = image['file_name']
+            if check_content:
+                full_image_path = self.images_dir / identifier
+                if not check_file_existence(full_image_path):
+                    content_errors.append('{}: does not exist'.format(full_image_path))
+            for target in get_image_annotation(image['id'], annotations):
+                if target['num_keypoints'] == 0:
+                    continue
+                keypoints = target['keypoints']  # flat sequence of x, y, visibility triples
+                keypoints_annotation = PoseEstimationAnnotation(
+                    identifier,
+                    np.array([keypoints[::3]]), np.array([keypoints[1::3]]), np.array([keypoints[2::3]]),
+                    np.array([target['category_id']])
+                )
+                keypoints_annotation.metadata['areas'] = [target['area']]
+                keypoints_annotation.metadata['rects'] = [target['bbox']]
+                keypoints_annotation.metadata['iscrowd'] = [target['iscrowd']]
+                keypoints_annotation.metadata['difficult_boxes'] = []
+
+                keypoints_annotations.append(keypoints_annotation)
+
+        return ConverterReturn(keypoints_annotations, {'label_map': {1: 'person'}}, content_errors)
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/ncf_converter.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/ncf_converter.py
index badb74fa03b..a903bec298d 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/ncf_converter.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/ncf_converter.py
@@ -27,8 +27,8 @@ class MovieLensConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'rating_file': PathField(description="Path to rating file."),
             'negative_file': PathField(description="Path to negative file."),
             'users_max_number': NumberField(
@@ -36,7 +36,7 @@ def parameters(cls):
             )
         })
 
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         self.rating_file = self.get_value_from_config('rating_file')
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/pascal_voc.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/pascal_voc.py
index 2044e26061c..e536007498e 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/pascal_voc.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/pascal_voc.py
@@ -15,14 +15,13 @@
 """
 
 from pathlib import Path
-from tqdm import tqdm
 
 from ..topology_types import ObjectDetection
 from ..config import PathField, BoolField
 from ..representation import DetectionAnnotation, SegmentationAnnotation
 from ..representation.segmentation_representation import GTMaskLoader
-from ..utils import get_path, read_txt, read_xml, check_file_existence
-from .format_converter import BaseFormatConverter, ConverterReturn
+from ..utils import get_path, read_txt, read_xml, check_file_existence, read_json
+from .format_converter import BaseFormatConverter, ConverterReturn, verify_label_map
 
 _VOC_CLASSES_DETECTION = (
     'aeroplane', 'bicycle', 'bird', 'boat',
@@ -43,9 +42,26 @@
 ))
 
 
-def prepare_detection_labels(has_background=True):
-    num_classes = len(_VOC_CLASSES_DETECTION)
+def reverse_label_map(label_map):  # swap keys and values; a repeated value keeps its last key
+    return dict(zip(label_map.values(), label_map.keys()))
+
+
+def prepare_detection_labels(dataset_meta, has_background=True):
     labels_shift = 1 if has_background else 0
+    if dataset_meta:
+        meta = read_json(dataset_meta)
+        if 'label_map' in meta:
+            meta['label_map'] = verify_label_map(meta['label_map'])
+            return reverse_label_map(meta['label_map'])
+        if 'labels' in meta:
+            labels = meta['labels']
+            num_classes = len(labels)
+            reversed_label_map = dict(zip(labels, list(range(labels_shift, num_classes + labels_shift))))
+            if has_background:
+                reversed_label_map['__background__'] = 0
+            return reversed_label_map
+
+    num_classes = len(_VOC_CLASSES_DETECTION)
     reversed_label_map = dict(zip(_VOC_CLASSES_DETECTION, list(range(labels_shift, num_classes + labels_shift))))
     if has_background:
         reversed_label_map['__background__'] = 0
@@ -53,18 +69,14 @@ def prepare_detection_labels(has_background=True):
     return reversed_label_map
 
 
-def reverse_label_map(label_map):
-    return {value: key for key, value in label_map.items()}
-
-
 class PascalVOCSegmentationConverter(BaseFormatConverter):
     __provider__ = 'voc_segmentation'
     annotation_types = (SegmentationAnnotation, )
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'imageset_file': PathField(description="Path to file with validation image list."),
             'images_dir': PathField(
                 optional=True, is_directory=True,
@@ -74,14 +86,19 @@ def parameters(cls):
                 optional=True, is_directory=True,
                 description="Path to directory with ground truth segmentation masks related to devkit root "
                             "(default SegmentationClass)."
+            ),
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map, color_encoding)', optional=True
             )
         })
 
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         self.image_set_file = self.get_value_from_config('imageset_file')
         self.image_dir = self.get_value_from_config('images_dir')
+        dataset_meta_file = self.get_value_from_config('dataset_meta_file')
+        self.dataset_meta = {} if not dataset_meta_file else read_json(dataset_meta_file)
         if not self.image_dir:
             self.image_dir = get_path(self.image_set_file.parents[-2] / 'JPEGImages', is_directory=True)
 
@@ -114,9 +131,9 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
                 progress_callback(image_id / num_iterations * 100)
 
         meta = {
-            'label_map': dict(enumerate(_VOC_CLASSES_SEGMENTATION)),
+            'label_map': self.dataset_meta.get('label_map', dict(enumerate(_VOC_CLASSES_SEGMENTATION))),
             'background_label': 0,
-            'segmentation_colors': _SEGMENTATION_COLORS
+            'segmentation_colors': self.dataset_meta.get('segmentation_colors', _SEGMENTATION_COLORS)
         }
 
         return ConverterReturn(annotations, meta, content_check_errors)
@@ -139,6 +156,9 @@ def parameters(cls):
             ),
             'has_background': BoolField(
                 optional=True, default=True, description="Allows convert dataset with/without adding background_label."
+            ),
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map, color_encoding)', optional=True
             )
         })
         return parameters
@@ -150,15 +170,16 @@ def configure(self):
             self.image_dir = get_path(self.image_set_file.parents[-2] / 'JPEGImages')
         self.annotations_dir = self.get_value_from_config('annotations_dir')
         self.has_background = self.get_value_from_config('has_background')
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
 
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
-        class_to_ind = prepare_detection_labels(self.has_background)
+        class_to_ind = prepare_detection_labels(self.dataset_meta, self.has_background)
         content_check_errors = [] if check_content else None
 
         detections = []
         image_set = read_txt(self.image_set_file, sep=None)
         num_iterations = len(image_set)
-        for (image_id, image) in tqdm(enumerate(image_set)):
+        for (image_id, image) in enumerate(image_set):
             root = read_xml(self.annotations_dir / '{}.xml'.format(image))
 
             identifier = root.find('.//filename').text
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/sample_converter.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/sample_converter.py
index 8018ecb6918..fc9ce014b0f 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/sample_converter.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/sample_converter.py
@@ -35,11 +35,12 @@ class SampleConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'data_dir': PathField(is_directory=True, description="Path to sample dataset root directory.")
         })
-        return parameters
+
+        return configuration_parameters
 
     def configure(self):
         """
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/squad.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/squad.py
new file mode 100644
index 00000000000..5f335636146
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/squad.py
@@ -0,0 +1,194 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+from collections import namedtuple
+
+import numpy as np
+
+from ..representation import QuestionAnsweringAnnotation
+from ..utils import read_json
+from ..config import PathField, NumberField, BoolField
+
+from .format_converter import BaseFormatConverter, ConverterReturn
+from ._nlp_common import get_tokenizer, CLS_ID, SEP_ID
+
+
+class SQUADConverter(BaseFormatConverter):
+    """Convert a SQuAD-style json file into QuestionAnsweringAnnotation objects, one per document span."""
+    __provider__ = "squad"
+    annotation_types = (QuestionAnsweringAnnotation, )
+
+    @classmethod
+    def parameters(cls):
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
+            'testing_file': PathField(description="Path to testing file."),
+            'vocab_file': PathField(description='Path to vocabulary file.', optional=True),
+            'sentence_piece_model_file': PathField(description='sentence piece model for tokenization', optional=True),
+            'max_seq_length': NumberField(
+                description='The maximum total input sequence length after WordPiece tokenization.',
+                optional=True, default=128
+            ),
+            'max_query_length': NumberField(
+                description='The maximum number of tokens for the question.',
+                optional=True, default=64
+            ),
+            'doc_stride': NumberField(
+                description="When splitting up a long document into chunks, how much stride to take between chunks.",
+                optional=True, default=128
+            ),
+            'lower_case': BoolField(optional=True, default=False, description='Switch tokens to lower case register')
+        })
+
+        return configuration_parameters
+
+    def configure(self):
+        self.testing_file = self.get_value_from_config('testing_file')
+        self.max_seq_length = self.get_value_from_config('max_seq_length')
+        self.max_query_length = self.get_value_from_config('max_query_length')
+        self.doc_stride = self.get_value_from_config('doc_stride')
+        self.lower_case = self.get_value_from_config('lower_case')
+        self.tokenizer = get_tokenizer(self.config, self.lower_case)
+        self.support_vocab = 'vocab_file' in self.config
+
+    @staticmethod
+    def _load_examples(file):
+        """Split each paragraph into tokens and return (examples, answers), one entry per question."""
+        def _is_whitespace(c):
+            return c in (" ", "\t", "\r", "\n") or ord(c) == 0x202F
+
+        examples = []
+        answers = []
+        data = read_json(file)['data']
+
+        for entry in data:
+            for paragraph in entry['paragraphs']:
+                paragraph_text = paragraph["context"]
+                doc_tokens = []
+                prev_is_whitespace = True
+                # only the characters accepted by _is_whitespace separate tokens
+                for c in paragraph_text:
+                    if _is_whitespace(c):
+                        prev_is_whitespace = True
+                    else:
+                        if prev_is_whitespace:
+                            doc_tokens.append(c)
+                        else:
+                            doc_tokens[-1] += c
+                        prev_is_whitespace = False
+
+                for qa in paragraph["qas"]:
+                    examples.append({
+                        'id': qa["id"],
+                        'question_text': qa["question"],
+                        'tokens': doc_tokens,
+                        'is_impossible': False
+                    })
+                    answers.append(qa["answers"])
+        return examples, answers
+
+    def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
+        """Tokenize every question/document pair and emit one annotation per document span."""
+        examples, answers = self._load_examples(self.testing_file)
+        annotations = []
+        unique_id = 1000000000
+        DocSpan = namedtuple("DocSpan", ["start", "length"])
+
+        for (example_index, example) in enumerate(examples):
+            if progress_callback is not None and example_index % progress_interval == 0:
+                progress_callback(example_index * 100 / len(examples))
+
+            query_tokens = self.tokenizer.tokenize(example['question_text'])
+            if len(query_tokens) > self.max_query_length:
+                query_tokens = query_tokens[:self.max_query_length]
+            all_doc_tokens = []
+            for token in example['tokens']:
+                all_doc_tokens.extend(self.tokenizer.tokenize(token))
+            # three positions are taken by the [CLS] marker and the two [SEP] markers
+            max_tokens_for_doc = self.max_seq_length - len(query_tokens) - 3
+            doc_spans = []
+            start_offset = 0
+            while start_offset < len(all_doc_tokens):
+                length = min(len(all_doc_tokens) - start_offset, max_tokens_for_doc)
+                doc_spans.append(DocSpan(start_offset, length))
+                if start_offset + length == len(all_doc_tokens):
+                    break
+                step = min(length, self.doc_stride)
+                if step < 1:
+                    # a non-positive step would never reach the end of the document
+                    raise ValueError('max_seq_length or doc_stride is too small to split the document')
+                start_offset += step
+
+            for idx, doc_span in enumerate(doc_spans):
+                tokens = []
+                segment_ids = []
+                tokens.append("[CLS]" if self.support_vocab else CLS_ID)
+                segment_ids.append(0)
+                for token in query_tokens:
+                    tokens.append(token)
+                    segment_ids.append(0)
+                tokens.append("[SEP]" if self.support_vocab else SEP_ID)
+                segment_ids.append(0)
+
+                for i in range(doc_span.length):
+                    split_token_index = doc_span.start + i
+                    tokens.append(all_doc_tokens[split_token_index])
+                    segment_ids.append(1)
+                tokens.append("[SEP]" if self.support_vocab else SEP_ID)
+                segment_ids.append(1)
+                # copy when tokens already are ids, so the padding below does not leak into `tokens`
+                input_ids = self.tokenizer.convert_tokens_to_ids(tokens) if self.support_vocab else list(tokens)
+                input_mask = [1] * len(input_ids)
+
+                while len(input_ids) < self.max_seq_length:
+                    input_ids.append(0)
+                    input_mask.append(0)
+                    segment_ids.append(0)
+
+                # NOTE(review): idx restarts for every example, so these identifiers repeat across examples
+                identifier = ['input_ids_{}'.format(idx), 'input_mask_{}'.format(idx), 'segment_ids_{}'.format(idx)]
+                annotation = QuestionAnsweringAnnotation(
+                    identifier,
+                    np.array(unique_id),
+                    np.array(input_ids),
+                    np.array(input_mask),
+                    np.array(segment_ids),
+                    tokens,
+                    answers[example_index],
+                )
+                annotations.append(annotation)
+                unique_id += 1
+        return ConverterReturn(annotations, None, None)
+
+    @staticmethod
+    def _is_max_context(doc_spans, cur_span_index, position):
+        """Tell whether span `cur_span_index` is the best-scoring span among those containing `position`."""
+        best_score = None
+        best_span_index = None
+        for (span_index, doc_span) in enumerate(doc_spans):
+            end = doc_span.start + doc_span.length - 1
+            if position < doc_span.start:
+                continue
+            if position > end:
+                continue
+            num_left_context = position - doc_span.start
+            num_right_context = end - position
+            score = min(num_left_context, num_right_context) + 0.01 * doc_span.length
+            if best_score is None or score > best_score:
+                best_score = score
+                best_span_index = span_index
+
+        return cur_span_index == best_span_index
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/super_resolution_converter.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/super_resolution_converter.py
index 1f4328d0387..389f22ac80b 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/super_resolution_converter.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/super_resolution_converter.py
@@ -15,11 +15,13 @@
 """
 
 import cv2
+import numpy as np
 from ..config import PathField, StringField, BoolField, ConfigError, NumberField
 from ..representation import SuperResolutionAnnotation
 from ..representation.super_resolution_representation import GTLoader
+from ..utils import check_file_existence
+from ..data_readers import MultiFramesInputIdentifier
 from .format_converter import BaseFormatConverter, ConverterReturn
-from  ..utils import check_file_existence
 
 LOADERS_MAPPING = {
     'opencv': GTLoader.OPENCV,
@@ -33,8 +35,8 @@ class SRConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'data_dir': PathField(
                 is_directory=True, description="Path to folder, where images in low and high resolution are located."
             ),
@@ -62,7 +64,7 @@ def parameters(cls):
             )
         })
 
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         self.data_dir = self.get_value_from_config('data_dir')
@@ -95,7 +97,7 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
                 if not check_file_existence(self.data_dir / hr_file_name):
                     content_errors.append('{}: does not exist'.format(self.data_dir / hr_file_name))
                 if self.two_streams and not check_file_existence(self.data_dir / upsampled_file_name):
-                    content_errors.append('{}: does not exist'.format(self.data_dir / hr_file_name))
+                    content_errors.append('{}: does not exist'.format(self.data_dir / upsampled_file_name))
 
             identifier = [lr_file_name, upsampled_file_name] if self.two_streams else lr_file_name
             annotation.append(SuperResolutionAnnotation(identifier, hr_file_name, gt_loader=self.annotation_loader))
@@ -109,3 +111,71 @@ def generate_upsample_file(original_image_path, scale_factor, upsampled_file_nam
         image = cv2.imread(str(original_image_path))
         upsampled_image = cv2.resize(image, None, fx=scale_factor, fy=scale_factor, interpolation=cv2.INTER_CUBIC)
         cv2.imwrite(str(original_image_path.parent / upsampled_file_name), upsampled_image)
+
+
+class SRMultiFrameConverter(BaseFormatConverter):  # sliding windows of LR frames, each with one HR target
+    __provider__ = 'multi_frame_super_resolution'
+    annotation_types = (SuperResolutionAnnotation, )
+
+    @classmethod
+    def parameters(cls):
+        params = super().parameters()
+        params.update({
+            'data_dir': PathField(
+                is_directory=True, description="Path to folder, where images in low and high resolution are located."
+            ),
+            'lr_suffix': StringField(
+                optional=True, default="lr", description="Low resolution file name's suffix."
+            ),
+            'hr_suffix': StringField(
+                optional=True, default="hr", description="High resolution file name's suffix."
+            ),
+            'number_input_frames': NumberField(
+                description='number inputs per inference', value_type=int,
+            ),
+            'annotation_loader': StringField(
+                optional=True, choices=LOADERS_MAPPING.keys(), default='pillow',
+                description="Which library will be used for ground truth image reading. "
+                            "Supported: {}".format(', '.join(LOADERS_MAPPING.keys()))
+            )
+        })
+        return params
+
+    def configure(self):
+        self.data_dir = self.get_value_from_config('data_dir')
+        self.lr_suffix = self.get_value_from_config('lr_suffix')
+        self.hr_suffix = self.get_value_from_config('hr_suffix')
+        self.annotation_loader = LOADERS_MAPPING.get(self.get_value_from_config('annotation_loader'))
+        self.num_frames = self.get_value_from_config('number_input_frames')
+        self.max_frame_id = self.get_value_from_config('max_frame_id')  # NOTE(review): undeclared param, unused here
+
+    def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
+        content_errors = [] if check_content else None
+        frames_ids = []
+        frame_names = []
+        annotations = []
+        for file_in_dir in self.data_dir.iterdir():
+            image_name = file_in_dir.parts[-1]
+            if self.lr_suffix in image_name and self.hr_suffix not in image_name:  # names with lr_suffix only
+                frame_names.append(image_name)
+                frames_ids.append(int(image_name.split(self.lr_suffix)[0]))  # text before lr_suffix is the frame id
+        sorted_frames = np.argsort(frames_ids)  # positions of the frames ordered by ascending id
+        frames_ids.sort()
+        sorted_frame_names = [frame_names[idx] for idx in sorted_frames]
+
+        num_iterations = len(frames_ids)
+        for idx, _ in enumerate(frames_ids):  # idx is the first frame of the current window
+            if len(frames_ids) - idx < self.num_frames:  # not enough frames left for a full window
+                break
+            input_ids = list(range(self.num_frames))  # positions of the frames inside the window
+            input_frames = [sorted_frame_names[idx + shift] for shift in input_ids]
+            hr_name = self.hr_suffix.join(input_frames[0].split(self.lr_suffix))  # first frame name, lr -> hr suffix
+            if check_content and not check_file_existence(self.data_dir / hr_name):
+                content_errors.append('{}: does not exist'.format(self.data_dir / hr_name))
+            annotations.append(SuperResolutionAnnotation(
+                MultiFramesInputIdentifier(input_ids, input_frames), hr_name, gt_loader=self.annotation_loader
+            ))
+            if progress_callback and idx % progress_interval == 0:
+                progress_callback(idx * 100 / num_iterations)
+
+        return ConverterReturn(annotations, None, content_errors)
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/text_classification.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/text_classification.py
new file mode 100644
index 00000000000..64457b55f56
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/text_classification.py
@@ -0,0 +1,337 @@
+from collections import namedtuple
+import csv
+import numpy as np
+try:
+    import tensorflow as tf
+except ImportError:
+    tf = None
+
+
+from ..config import PathField, StringField, NumberField, BoolField, ConfigError
+from ..representation import TextClassificationAnnotation
+from ..utils import string_to_list
+from .format_converter import BaseFormatConverter, ConverterReturn
+from ._nlp_common import get_tokenizer, truncate_seq_pair, SEG_ID_A, SEG_ID_B, SEP_ID, CLS_ID, SEG_ID_CLS, SEG_ID_PAD
+
+
+InputExample = namedtuple('InputExample', ['guid', 'text_a', 'text_b', 'label'])  # one sample before tokenization
+labels = {  # dataset name -> class names; converters turn the list position into the label id via enumerate
+    'xnli': ["contradiction", "entailment", "neutral"],
+    'mnli': ["contradiction", "entailment", "neutral"],
+    'imdb': ['neg', 'pos'],
+    'mrpc': ['0', '1'],
+    'cola': ['0', '1']
+}
+
+
+class BaseGLUETextClassificationConverter(BaseFormatConverter):
+    """Base for tsv text classification converters; subclasses set label_map and column indices."""
+    annotation_types = (TextClassificationAnnotation, )
+
+    @classmethod
+    def parameters(cls):
+        params = super().parameters()
+        params.update({
+            'annotation_file': PathField(description='path to annotation file in json or tsv format'),
+            'vocab_file': PathField(description='Path to vocabulary file for word piece tokenizer', optional=True),
+            'sentence_piece_model_file': PathField(description='sentence piece model for tokenization', optional=True),
+            'max_seq_length': NumberField(
+                description='The maximum total input sequence length after tokenization.',
+                optional=True, default=128
+            ),
+            'lower_case': BoolField(optional=True, default=False, description='Switch tokens to lower case register')
+        })
+
+        return params
+
+    def configure(self):
+        self.annotation_file = self.get_value_from_config('annotation_file')
+        self.max_seq_length = self.get_value_from_config('max_seq_length')
+        self.lower_case = self.get_value_from_config('lower_case')
+        self.tokenizer = get_tokenizer(self.config, self.lower_case)
+        # label_map (label id -> class name) has to be set by the subclass before this point
+        self.reversed_label_map = {value: key for key, value in self.label_map.items()}
+        self.support_vocab = 'vocab_file' in self.config
+
+    def read_tsv(self):
+        """Read annotation_file as tsv, skip the header row and return a list of InputExample."""
+        lines = []
+        with self.annotation_file.open('r') as ann_file:
+            reader = csv.reader(ann_file, delimiter="\t", quotechar=None)
+            for idx, line in enumerate(reader):
+                if idx == 0:
+                    continue
+                guid = "dev-{}".format(idx)
+                label = self.reversed_label_map[line[self.label_ind]]
+                text_a = line[self.text_a_ind]
+                text_b = line[self.text_b_ind] if self.text_b_ind is not None else None
+                lines.append(InputExample(guid, text_a, text_b, label))
+
+        return lines
+
+    def convert_single_example(self, example):
+        """Convert one InputExample to a left-padded `A [SEP] (B [SEP]) [CLS]` TextClassificationAnnotation."""
+        identifier = [
+            'input_ids_{}'.format(example.guid),
+            'input_mask_{}'.format(example.guid),
+            'segment_ids_{}'.format(example.guid)
+        ]
+        tokens_a = self.tokenizer.tokenize(example.text_a)
+        tokens_b = self.tokenizer.tokenize(example.text_b) if example.text_b else None
+
+        if tokens_b:
+            # Modifies `tokens_a` and `tokens_b` in place so that the total
+            # length is less than the specified length.
+            # Account for two [SEP] & one [CLS] with "- 3"
+            truncate_seq_pair(tokens_a, tokens_b, self.max_seq_length - 3)
+        else:
+            # Account for one [SEP] & one [CLS] with "- 2"
+            if len(tokens_a) > self.max_seq_length - 2:
+                tokens_a = tokens_a[:self.max_seq_length - 2]
+
+        tokens = list(tokens_a)
+        segment_ids = [SEG_ID_A] * len(tokens_a)
+        tokens.append('[SEP]' if self.support_vocab else SEP_ID)
+        segment_ids.append(SEG_ID_A)
+
+        if tokens_b:
+            tokens.extend(tokens_b)
+            segment_ids.extend([SEG_ID_B] * len(tokens_b))
+            tokens.append('[SEP]' if self.support_vocab else SEP_ID)
+            segment_ids.append(SEG_ID_B)
+
+        # the classification token closes the sequence
+        tokens.append("[CLS]" if self.support_vocab else CLS_ID)
+        segment_ids.append(SEG_ID_CLS)
+
+        input_ids = self.tokenizer.convert_tokens_to_ids(tokens) if self.support_vocab else tokens
+
+        # The mask has 0 for real tokens and 1 for padding tokens. Only real
+        # tokens are attended to.
+        input_mask = [0] * len(input_ids)
+
+        # Left-pad with zeros up to the sequence length.
+        if len(input_ids) < self.max_seq_length:
+            delta_len = self.max_seq_length - len(input_ids)
+            input_ids = [0] * delta_len + input_ids
+            input_mask = [1] * delta_len + input_mask
+            segment_ids = [SEG_ID_PAD] * delta_len + segment_ids
+
+        return TextClassificationAnnotation(
+            identifier, example.label, np.array(input_ids), np.array(input_mask), np.array(segment_ids), tokens
+        )
+
+    def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
+        """Convert every example of the annotation file; the returned meta carries label_map."""
+        examples = self.read_tsv()
+        annotations = []
+        num_iter = len(examples)
+        for example_id, example in enumerate(examples):
+            annotations.append(self.convert_single_example(example))
+            if progress_callback and example_id % progress_interval == 0:
+                progress_callback(example_id * 100 / num_iter)
+
+        return ConverterReturn(annotations, {'label_map': self.label_map}, None)
+
+
+class XNLIDatasetConverter(BaseGLUETextClassificationConverter):  # XNLI tsv reader with optional language filter
+    __provider__ = 'xnli'
+
+    def __init__(self, config):
+        self.label_map = dict(enumerate(labels['xnli']))  # label id -> class name
+        self.label_ind = 1  # column indices used by read_tsv() to pick fields of a row
+        self.text_a_ind = 6
+        self.text_b_ind = 7
+        self.lang_ind = 0  # column holding the language code of the row
+        super().__init__(config)
+
+    @classmethod
+    def parameters(cls):
+        params = super().parameters()
+        params.update({
+            'language_filter': StringField(
+                description='comma-separated list of languages for selection only appropriate annotations.'
+                'If not provided full dataset used',
+                optional=True
+                )
+        })
+
+        return params
+
+    def configure(self):
+        super().configure()
+        self.language_filter = self.get_value_from_config('language_filter')
+        if self.language_filter is not None:
+            self.language_filter = string_to_list(self.language_filter)  # comma-separated string -> list
+
+    def read_tsv(self):  # returns a list of InputExample, restricted to language_filter when it is set
+        lines = []
+        with self.annotation_file.open('r') as ann_file:
+            reader = csv.reader(ann_file, delimiter="\t", quotechar=None)
+            for idx, line in enumerate(reader):
+                if idx == 0:  # header row
+                    continue
+                guid = "dev-{}".format(idx)  # idx counts file rows, so guids keep gaps for filtered rows
+                language = line[self.lang_ind]
+                if self.language_filter and language not in self.language_filter:
+                    continue
+                label = self.reversed_label_map[line[self.label_ind]]
+                text_a = line[self.text_a_ind]
+                text_b = line[self.text_b_ind]
+                lines.append(InputExample(guid, text_a, text_b, label))
+
+        return lines
+
+
+class MNLIDatasetConverter(BaseGLUETextClassificationConverter):  # MNLI flavour of the tsv converter
+    __provider__ = 'mnli'
+
+    def __init__(self, config):
+        self.label_map = dict(enumerate(labels['mnli']))  # label id -> class name
+        self.label_ind = -1  # the label is taken from the last column of a row
+        self.text_a_ind = 6  # column of text_a
+        self.text_b_ind = 7  # column of text_b
+        super().__init__(config)  # presumably triggers configure(), which needs label_map - confirm
+
+
+class BertTextClassificationTFRecordConverter(BaseFormatConverter):  # reads ready-made features from a tf_record
+    __provider__ = 'bert_tf_record'
+    annotation_types = (TextClassificationAnnotation, )
+
+    @classmethod
+    def parameters(cls):
+        params = super().parameters()
+        params.update({
+            'annotation_file': PathField(description='path to predict.tf_record format'),
+        })
+
+        return params
+
+    def configure(self):
+        if tf is None:  # the module-level import is optional, so the dependency is checked here
+            raise ConfigError(
+                'bert_tf_record converter requires TensorFlow installation. Please install it first.'
+            )
+        self.annotation_file = self.get_value_from_config('annotation_file')
+
+    def read_tf_record(self):  # returns a list of [input_ids, input_mask, segment_ids, label_ids] per record
+        # NOTE(review): tf.python_io is the TF 1.x namespace - confirm the supported TensorFlow version
+        record_iterator = tf.python_io.tf_record_iterator(path=str(self.annotation_file))
+        record_list = []
+        for string_record in record_iterator:
+            example = tf.train.Example()
+            example.ParseFromString(string_record)
+            input_ids = example.features.feature['input_ids'].int64_list.value
+            input_mask = example.features.feature['input_mask'].int64_list.value
+            label_ids = example.features.feature['label_ids'].int64_list.value
+            segment_ids = example.features.feature['segment_ids'].int64_list.value
+            record_list.append([input_ids, input_mask, segment_ids, label_ids])
+        return record_list
+
+    @staticmethod
+    def convert_single_example(example, guid):  # example layout follows read_tf_record(); guid makes names unique
+        identifier = [
+            'input_ids_{}'.format(guid),
+            'input_mask_{}'.format(guid),
+            'segment_ids_{}'.format(guid)
+        ]
+
+        return TextClassificationAnnotation(  # argument order: label, input_ids, input_mask, segment_ids, tokens
+            identifier, np.array(example[3]), np.array(example[0]), np.array(example[1]), np.array(example[2]), None
+        )
+
+    def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
+        examples = self.read_tf_record()
+        annotations = []
+        num_iter = len(examples)
+
+        for idx, example in enumerate(examples):
+            annotations.append(self.convert_single_example(example, idx))  # record position serves as guid
+            if progress_callback and idx % progress_interval == 0:
+                progress_callback(idx * 100 / num_iter)
+
+        return ConverterReturn(annotations, None, None)  # no dataset meta and no content check results
+
+
+class BertXNLITFRecordConverter(BertTextClassificationTFRecordConverter):  # parent conversion + XNLI label_map
+    __provider__ = 'bert_xnli_tf_record'
+
+    def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
+        annotations, _, errors = super().convert(check_content, progress_callback, progress_interval, **kwargs)
+
+        return ConverterReturn(annotations, {'label_map':  dict(enumerate(labels['xnli']))}, errors)
+
+
+class MRPCConverter(BaseGLUETextClassificationConverter):  # MRPC flavour of the tsv converter
+    __provider__ = 'mrpc'
+
+    def __init__(self, config):
+        self.label_map = dict(enumerate(labels['mrpc']))  # label id -> class name
+        self.label_ind = 0  # column of the label
+        self.text_a_ind = 3  # column of text_a
+        self.text_b_ind = 4  # column of text_b; the inherited read_tsv() reads exactly this attribute
+        super().__init__(config)
+
+
+class CoLAConverter(BaseGLUETextClassificationConverter):  # CoLA flavour of the tsv converter
+    __provider__ = 'cola'
+
+    def __init__(self, config):
+        self.label_map = dict(enumerate(labels['cola']))  # label id -> class name
+        self.label_ind = 1  # column of the label
+        self.text_a_ind = 3  # column of text_a
+        self.text_b_ind = None  # no second text column: read_tsv() sets text_b to None
+        super().__init__(config)
+
+
+class IMDBConverter(BaseGLUETextClassificationConverter):
+    """Converter for IMDB reviews stored as `<data_dir>/<label>/*.txt` files, one review per file."""
+    __provider__ = 'imdb'
+    annotation_types = (TextClassificationAnnotation, )
+
+    @classmethod
+    def parameters(cls):
+        # tokenizer related options are inherited unchanged from the base converter,
+        # only the annotation source differs: a directory instead of a single file
+        params = super().parameters()
+        params.pop('annotation_file')
+        params.update({
+            'data_dir': PathField(is_directory=True, description='path to directory  with annotation samples'),
+        })
+
+        return params
+
+    def configure(self):
+        # the base configure() is not reused: it reads 'annotation_file', which is not declared here
+        self.data_dir = self.get_value_from_config('data_dir')
+        self.max_seq_length = self.get_value_from_config('max_seq_length')
+        self.lower_case = self.get_value_from_config('lower_case')
+        self.tokenizer = get_tokenizer(self.config, self.lower_case)
+        imdb_labels = labels['imdb']
+        self.label_map = dict(enumerate(imdb_labels))
+        self.reversed_label_map = {value: key for key, value in self.label_map.items()}
+        self.support_vocab = 'vocab_file' in self.config
+
+    def _create_examples(self):
+        """Read every review under `data_dir/<label>/` into an InputExample with a dataset-wide unique guid."""
+        examples = []
+        for label in labels['imdb']:
+            cur_dir = self.data_dir / label
+            for filename in cur_dir.glob('*.txt'):
+                with filename.open() as f:
+                    text = f.read().strip().replace("<br />", " ")
+                # a running counter (not a per-directory index) keeps guids unique across labels
+                examples.append(InputExample(
+                    guid=len(examples), text_a=text, text_b=None, label=self.reversed_label_map[label]))
+        return examples
+
+    def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
+        """Convert all reviews found in data_dir; the returned meta carries label_map."""
+        examples = self._create_examples()
+        annotations = []
+        num_iter = len(examples)
+        for example_id, example in enumerate(examples):
+            annotations.append(self.convert_single_example(example))
+            if progress_callback and example_id % progress_interval == 0:
+                progress_callback(example_id * 100 / num_iter)
+
+        return ConverterReturn(annotations, {'label_map': self.label_map}, None)
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/vgg_face_regression.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/vgg_face_regression.py
index a41155cfc37..3bd70b70100 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/vgg_face_regression.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/vgg_face_regression.py
@@ -29,8 +29,8 @@ class VGGFaceRegressionConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'landmarks_csv_file': PathField(description="Path to csv file with coordinates of landmarks points."),
             'bbox_csv_file': PathField(
                 optional=True, description="Path to cvs file which contains bounding box coordinates for faces."
@@ -41,7 +41,7 @@ def parameters(cls):
             )
         })
 
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         self.landmarks_csv = self.get_value_from_config('landmarks_csv_file')
@@ -76,7 +76,7 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
         if self.bbox_csv:
             for index, row in enumerate(read_csv(self.bbox_csv)):
                 annotations[index].metadata['rect'] = convert_bboxes_xywh_to_x1y1x2y2(
-                    int(row["X"]), int(row["Y"]), int(row["W"]), int(row["H"])
+                    max(int(row["X"]), 0), max(int(row["Y"]), 0), max(int(row["W"]), 0), max(int(row["H"]), 0)
                 )
 
         meta = {
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/wider.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/wider.py
index 6b2f2796383..18b58046405 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/wider.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/wider.py
@@ -16,9 +16,9 @@
 
 from ..config import NumberField, PathField
 from ..representation import DetectionAnnotation
-from ..utils import convert_bboxes_xywh_to_x1y1x2y2, read_txt, check_file_existence
+from ..utils import convert_bboxes_xywh_to_x1y1x2y2, read_txt, check_file_existence, read_json
 
-from .format_converter import BaseFormatConverter, ConverterReturn
+from .format_converter import BaseFormatConverter, ConverterReturn, verify_label_map
 
 
 class WiderFormatConverter(BaseFormatConverter):
@@ -27,8 +27,8 @@ class WiderFormatConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        configuration_parameters = super().parameters()
+        configuration_parameters.update({
             'annotation_file': PathField(
                 description="Path to xml file, which contains ground truth data in WiderFace dataset format."
             ),
@@ -40,23 +40,25 @@ def parameters(cls):
             'images_dir': PathField(
                 is_directory=True, optional=True,
                 description='path to dataset images, used only for content existence check'
+            ),
+            'dataset_meta_file': PathField(
+                description='path to json file with dataset meta (e.g. label_map, color_encoding)', optional=True
             )
         })
 
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         self.annotation_file = self.get_value_from_config('annotation_file')
         self.label_start = self.get_value_from_config('label_start')
         self.images_dir = self.get_value_from_config('images_dir') or self.annotation_file.parent
+        self.dataset_meta = self.get_value_from_config('dataset_meta_file')
 
     def convert(self, check_content=False, progress_callback=None, progress_interval=100, **kwargs):
         image_annotations = read_txt(self.annotation_file)
         content_errors = None if not check_content else []
-        image_ids = []
-        for image_id, line in enumerate(image_annotations):
-            if '.jpg' in line:
-                image_ids.append(image_id)
+        image_ids = [image_id for image_id, line in enumerate(image_annotations) if '.jpg' in line]
+        meta = self.generate_meta()
 
         annotations = []
         num_iterations = len(image_ids)
@@ -84,6 +86,30 @@ def convert(self, check_content=False, progress_callback=None, progress_interval
             if progress_callback and index % progress_interval == 0:
                 progress_callback(index * 100 / num_iterations)
 
-        meta = {'label_map': {0: '__background__', self.label_start: 'face'}, 'background_label': 0}
-
         return ConverterReturn(annotations, meta, content_errors)
+
+    def generate_meta(self):  # builds dataset meta: label_map plus optional background_label
+        if not self.dataset_meta:  # no meta file: defaults derived from label_start
+            if self.label_start != 0:
+                return {'label_map': {0: '__background__', self.label_start: 'face'}, 'background_label': 0}
+            return {'label_map': {self.label_start: 'face'}}  # id 0 is taken by 'face', no background entry
+        dataset_meta = read_json(self.dataset_meta)
+        background_label = dataset_meta.get('background_label', -1)  # -1 stands for "not specified"
+        labels = dataset_meta.get('labels')
+        label_map = {0: '__background__', self.label_start: 'face'}  # fallback without 'labels'/'label_map'
+        if labels:
+            label_map = {  # ids are shifted by label_start, background-like names are pinned to 0
+                label_id + self.label_start if label not in ('background', '__background__') else 0: label
+                for label_id, label in enumerate(labels)
+            }
+            label_map[background_label] = '__background__'  # NOTE(review): key -1 if unset - intended?
+
+        label_map = verify_label_map(dataset_meta.get('label_map', label_map))  # explicit label_map from file wins
+        valid_labels = [key for key in label_map if key != background_label]
+        self.background_label = background_label
+        self.label_start = sorted(valid_labels)[0]  # side effect: becomes the smallest non-background id
+        meta = {'label_map': label_map}
+        if background_label != -1:
+            meta['background_label'] = background_label
+
+        return meta
diff --git a/tools/accuracy_checker/accuracy_checker/annotation_converters/wmt.py b/tools/accuracy_checker/accuracy_checker/annotation_converters/wmt.py
index 74c5c1645b0..ca720e4babc 100644
--- a/tools/accuracy_checker/accuracy_checker/annotation_converters/wmt.py
+++ b/tools/accuracy_checker/accuracy_checker/annotation_converters/wmt.py
@@ -21,14 +21,14 @@ class WMTConverter(BaseFormatConverter):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update(
+        configuration_parameters = super().parameters()
+        configuration_parameters.update(
             {
                 'input_file': PathField(description='path to input file'),
                 'reference_file': PathField(description='path to file with reference for translation')
             }
         )
-        return parameters
+        return configuration_parameters
 
     def configure(self):
         self.input_file = self.get_value_from_config('input_file')
diff --git a/tools/accuracy_checker/accuracy_checker/config/config_reader.py b/tools/accuracy_checker/accuracy_checker/config/config_reader.py
index 931b13ab907..6af6e1c7903 100644
--- a/tools/accuracy_checker/accuracy_checker/config/config_reader.py
+++ b/tools/accuracy_checker/accuracy_checker/config/config_reader.py
@@ -16,6 +16,7 @@
 
 import copy
 from pathlib import Path
+import os
 
 import warnings
 
@@ -26,6 +27,7 @@
     'launchers': {
         'model': 'models',
         'weights': 'models',
+        'color_coeff': 'models',
         'caffe_model': 'models',
         'caffe_weights': 'models',
         'tf_model': 'models',
@@ -36,7 +38,8 @@
         'cpu_extensions': 'extensions',
         'gpu_extensions': 'extensions',
         'bitstream': 'bitstreams',
-        'affinity_map': 'affinity_map'
+        'affinity_map': 'affinity_map',
+        'predictions': 'source'
     },
     'datasets': {
         'segmentation_masks_source': 'source',
@@ -46,6 +49,16 @@
     },
 }
 
+COMMAND_LINE_ARGS_AS_ENV_VARS = {
+    'source': 'DATA_DIR',
+    'annotations': 'ANNOTATIONS_DIR',
+    'bitstreams': 'BITSTREAMS_DIR',
+    'models': 'MODELS_DIR',
+    'extensions': 'EXTENSIONS_DIR',
+}
+DEFINITION_ENV_VAR = 'DEFINITIONS_FILE'
+CONFIG_SHARED_PARAMETERS = ['bitstream']
+
 
 class ConfigReader:
     """
@@ -77,14 +90,19 @@ def merge(arguments):
     def process_config(config, mode='models', arguments=None):
         if arguments is None:
             arguments = dict()
-        ConfigReader._provide_cmd_arguments(arguments, config, mode)
         ConfigReader._merge_paths_with_prefixes(arguments, config, mode)
+        ConfigReader._provide_cmd_arguments(arguments, config, mode)
         ConfigReader._filter_launchers(config, arguments, mode)
+        ConfigReader._separate_evaluations(config, mode)
+        ConfigReader._previous_configuration_parameters_sharing(config, mode)
 
     @staticmethod
     def _read_configs(arguments):
-        global_config = read_yaml(arguments.definitions) if arguments.definitions else None
         local_config = read_yaml(arguments.config)
+        definitions = os.environ.get(DEFINITION_ENV_VAR) or local_config.get('global_definitions')
+        if definitions:
+            definitions = read_yaml(Path(arguments.config).parent / definitions)
+        global_config = read_yaml(arguments.definitions) if arguments.definitions else definitions
 
         return global_config, local_config
 
@@ -104,9 +122,8 @@ def _check_models_config(config):
             for model in models:
                 if _is_requirements_missed(model, required_model_entries):
                     raise ConfigError('Each model must specify {}'.format(', '.join(required_model_entries)))
-
-                if list(filter(lambda entry: _is_requirements_missed(entry, required_dataset_entries),
-                               model['datasets'])):
+                datasets = model['datasets'].values() if isinstance(model['datasets'], dict) else model['datasets']
+                if list(filter(lambda entry: _is_requirements_missed(entry, required_dataset_entries), datasets)):
                     raise ConfigError(required_dataset_error.format(model['name'], ', '.join(required_dataset_entries)))
 
         def _check_pipelines_config(config):
@@ -138,12 +155,33 @@ def _count_entry(stages, entry):
                 if not count_metrics:
                     raise ConfigError('Metrics are not specified')
 
-        if 'pipelines' in config:
-            _check_pipelines_config(config)
-            return 'pipelines'
+        def _check_module_config(config):
+            required_entries = ['name', 'module']
+            evaluations = config['evaluations']
+            if not evaluations:
+                raise ConfigError('Missed "{}" in local config'.format('evaluations'))
+            for evaluation in evaluations:
+                if _is_requirements_missed(evaluation, required_entries):
+                    raise ConfigError('Each evaluations must specify {}'.format(', '.join(required_entries)))
+
+        config_checkers = {
+            'evaluations': _check_module_config,
+            'models': _check_models_config,
+            'pipelines': _check_pipelines_config,
+        }
+
+        if not isinstance(config, dict):
+            raise ConfigError('local config should has dictionary based structure')
+
+        eval_mode = get_mode(config)
+        config_checker_func = config_checkers.get(eval_mode)
+        if config_checker_func is None:
+            raise ConfigError('Accuracy Checker {} mode is not supported. Please select between {}'. format(
+                eval_mode, ', '.join(['evaluations', 'models', 'pipelines'])
+            ))
+        config_checker_func(config)
 
-        _check_models_config(config)
-        return 'models'
+        return eval_mode
 
     @staticmethod
     def _prepare_global_configs(global_configs):
@@ -169,59 +207,87 @@ def merge(local_entries, global_entries, identifier):
             merge(dataset.get('postprocessing'), global_configs.get('postprocessing'), 'type')
 
     @staticmethod
-    def _merge_configs(global_configs, local_config, arguments, mode='models'):
-        def _merge_models_config(global_configs, local_config, arguments):
-            config = copy.deepcopy(local_config)
-            if not global_configs:
-                return config
+    def _merge_models_config(global_configs, local_config, arguments):
+        config = copy.deepcopy(local_config)
+        if not global_configs:
+            return config
 
-            models = config.get('models')
-            for model in models:
-                if 'launchers' in global_configs:
-                    for i, launcher_entry in enumerate(model['launchers']):
-                        model['launchers'][i] = ConfigReader._merge_configs_by_identifier(
-                            global_configs['launchers'], launcher_entry, 'framework'
-                        )
-                if 'datasets' in global_configs:
-                    for i, dataset in enumerate(model['datasets']):
-                        model['datasets'][i] = ConfigReader._merge_configs_by_identifier(
-                            global_configs['datasets'], dataset, 'name'
+        models = config['models']
+        for model in models:
+            if 'launchers' in global_configs:
+                for i, launcher_entry in enumerate(model['launchers']):
+                    model['launchers'][i] = ConfigReader._merge_configs_by_identifier(
+                        global_configs['launchers'], launcher_entry, 'framework'
+                    )
+            if 'datasets' in global_configs:
+                for i, dataset in enumerate(model['datasets']):
+                    model['datasets'][i] = ConfigReader._merge_configs_by_identifier(
+                        global_configs['datasets'], dataset, 'name'
+                    )
+
+        config['models'] = models
+        return config
+
+    @staticmethod
+    def _merge_pipelines_config(global_config, local_config, args):
+        config = copy.deepcopy(local_config)
+        pipelines = []
+        raw_pipelines = local_config['pipelines']
+        for pipeline in raw_pipelines:
+            device_infos = pipeline.get('device_info', [])
+            if not device_infos and 'target_devices' in args and args.target_devices:
+                device_infos = [{'device': device} for device in args.target_devices]
+            per_device_pipelines = []
+            for device_info in device_infos:
+                copy_pipeline = copy.deepcopy(pipeline)
+                for stage in copy_pipeline['stages']:
+                    if 'launcher' in stage:
+                        stage['launcher'].update(device_info)
+                        if global_config and global_config is not None and 'launchers' in global_config:
+                            stage['launcher'] = ConfigReader._merge_configs_by_identifier(
+                                global_config['launchers'], stage['launcher'], 'framework'
+                            )
+                    if 'dataset' in stage and global_config is not None and 'datasets' in global_config:
+                        dataset = stage['dataset']
+                        stage['dataset'] = ConfigReader._merge_configs_by_identifier(
+                            global_config['datasets'], dataset, 'name'
                         )
+                per_device_pipelines.append(copy_pipeline)
+            pipelines.extend(per_device_pipelines)
+        config['pipelines'] = pipelines
 
-            return config
+        return config
 
-        def _merge_pipelines_config(global_config, local_config, args):
-            config = copy.deepcopy(local_config)
-            pipelines = []
-            raw_pipelines = local_config['pipelines']
-            for pipeline in raw_pipelines:
-                device_infos = pipeline.get('device_info', [])
-                if not device_infos:
-                    device_infos = [{'device': device} for device in args.target_devices]
-                per_device_pipelines = []
-                for device_info in device_infos:
-                    copy_pipeline = copy.deepcopy(pipeline)
-                    for stage in copy_pipeline['stages']:
-                        if 'launcher' in stage:
-                            stage['launcher'].update(device_info)
-                            if global_config and global_config is not None and 'launchers' in global_config:
-                                stage['launcher'] = ConfigReader._merge_configs_by_identifier(
-                                    global_config['launchers'], stage['launcher'], 'framework'
-                                )
-                        if 'dataset' in stage and global_config is not None and 'datasets' in global_config:
-                            dataset = stage['dataset']
-                            stage['dataset'] = ConfigReader._merge_configs_by_identifier(
-                                global_configs['datasets'], dataset, 'name'
-                            )
-                    per_device_pipelines.append(copy_pipeline)
-                pipelines.extend(per_device_pipelines)
-            config['pipelines'] = pipelines
+    @staticmethod
+    def _merge_module_config(global_config, local_config, args):
 
+        config = copy.deepcopy(local_config)
+        if not global_config:
             return config
 
+        for evaluation in config['evaluations']:
+            if 'module_config' not in evaluation:
+                continue
+            module_config = evaluation['module_config']
+            if 'launchers' in module_config and 'launchers' in global_config:
+                for i, launcher_entry in enumerate(module_config['launchers']):
+                    module_config['launchers'][i] = ConfigReader._merge_configs_by_identifier(
+                        global_config['launchers'], launcher_entry, 'framework'
+                    )
+            if 'datasets' in module_config and 'datasets' in global_config:
+                for i, dataset in enumerate(module_config['datasets']):
+                    module_config['datasets'][i] = ConfigReader._merge_configs_by_identifier(
+                        global_config['datasets'], dataset, 'name'
+                    )
+
+        return config
+
+    @staticmethod
+    def _merge_configs(global_configs, local_config, arguments, mode='models'):
         functors_by_mode = {
-            'models': _merge_models_config,
-            'pipelines': _merge_pipelines_config
+            'models': ConfigReader._merge_models_config,
+            'pipelines': ConfigReader._merge_pipelines_config,
+            'evaluations': ConfigReader._merge_module_config
         }
 
         return functors_by_mode[mode](global_configs, local_config, arguments)
@@ -252,85 +318,41 @@ def _merge_configs_by_identifier(global_config, local_config, identifier):
     @staticmethod
     def _merge_paths_with_prefixes(arguments, config, mode='models'):
         args = arguments if isinstance(arguments, dict) else vars(arguments)
-
-        def merge_entry_paths(keys, value):
-            for field, argument in keys.items():
-                if field not in value:
-                    continue
-
-                config_path = Path(value[field])
-                if config_path.is_absolute():
-                    value[field] = Path(value[field])
-                    continue
-
-                if argument not in args or not args[argument]:
-                    continue
-
-                if not args[argument].is_dir():
-                    raise ConfigError('argument: {} should be a directory'.format(argument))
-                value[field] = args[argument] / config_path
-
-        def process_config(
-                config_item, entries_paths, dataset_identifier='datasets',
-                launchers_identifier='launchers', identifiers_mapping=None
-        ):
-
-            def process_dataset(datasets_configs):
-                if not isinstance(datasets_configs, list):
-                    datasets_configs = [datasets_configs]
-                for datasets_config in datasets_configs:
-                    annotation_conversion_config = datasets_config.get('annotation_conversion')
-                    if annotation_conversion_config:
-                        command_line_conversion = (create_command_line_mapping(annotation_conversion_config, 'source'))
-                        merge_entry_paths(command_line_conversion, annotation_conversion_config)
-                    if 'preprocessing' in datasets_config:
-                        for preprocessor in datasets_config['preprocessing']:
-                            command_line_preprocessing = (create_command_line_mapping(preprocessor, 'models'))
-                            merge_entry_paths(command_line_preprocessing, preprocessor)
-
-            def process_launchers(launchers_configs):
-                if not isinstance(launchers_configs, list):
-                    launchers_configs = [launchers_configs]
-
-                for launcher_config in launchers_configs:
-                    adapter_config = launcher_config.get('adapter')
-                    if not isinstance(adapter_config, dict):
-                        continue
-                    command_line_adapter = (create_command_line_mapping(adapter_config, 'models'))
-                    merge_entry_paths(command_line_adapter, adapter_config)
-
-            for entry, command_line_arg in entries_paths.items():
-                entry_id = entry if not identifiers_mapping else identifiers_mapping[entry]
-                if entry_id not in config_item:
-                    continue
-
-                if entry_id == dataset_identifier:
-                    process_dataset(config_item[entry_id])
-
-                if entry_id == launchers_identifier:
-                    launchers_configs = config_item[entry_id]
-                    process_launchers(launchers_configs)
-
-                config_entries = config_item[entry_id]
-                if not isinstance(config_entries, list):
-                    config_entries = [config_entries]
-                for config_entry in config_entries:
-                    merge_entry_paths(command_line_arg, config_entry)
+        for argument, env_var in COMMAND_LINE_ARGS_AS_ENV_VARS.items():
+            if argument not in args or args[argument] is None:
+                env_var_value = os.environ.get(env_var)
+                if env_var_value is not None:
+                    args[argument] = Path(env_var_value)
 
         def process_models(config, entries_paths):
             for model in config['models']:
-                process_config(model, entries_paths)
+                process_config(model, entries_paths, args)
 
         def process_pipelines(config, entries_paths):
             identifiers_mapping = {'datasets': 'dataset', 'launchers': 'launcher', 'reader': 'reader'}
             entries_paths.update({'reader': {'data_source': 'source'}})
             for pipeline in config['pipelines']:
                 for stage in pipeline['stages']:
-                    process_config(stage, entries_paths, 'dataset', 'launcher', identifiers_mapping)
+                    process_config(stage, entries_paths, args, 'dataset', 'launcher', identifiers_mapping)
+
+        def process_modules(config, entries_paths):
+            """Prefix relative paths inside every evaluation's module_config, including network_info entries."""
+            for evaluation in config['evaluations']:
+                module_config = evaluation.get('module_config')
+                if not module_config:
+                    continue
+                process_config(module_config, entries_paths, args)
+                networks_info = module_config.get('network_info')
+                if isinstance(networks_info, dict):
+                    networks_info = list(networks_info.values())
+                if isinstance(networks_info, list):
+                    for params in networks_info:  # merge each per-network entry, never the list itself
+                        merge_entry_paths(entries_paths['launchers'], params, args)
 
         functors_by_mode = {
             'models': process_models,
-            'pipelines': process_pipelines
+            'pipelines': process_pipelines,
+            'evaluations': process_modules
         }
 
         processing_func = functors_by_mode[mode]
@@ -355,16 +377,18 @@ def merge_dlsdk_launcher_args(arguments, launcher_entry, update_launcher_entry):
             if models_prefix:
                 launcher_entry['_models_prefix'] = models_prefix
 
-            if 'converted_models' not in arguments or not arguments.converted_models:
-                return launcher_entry
-
-            mo_params = launcher_entry.get('mo_params', {})
+            if 'deprecated_ir_v7' in arguments and arguments.deprecated_ir_v7:
+                mo_flags = launcher_entry.get('mo_flags', [])
+                mo_flags.append('generate_deprecated_IR_V7')
+                launcher_entry['mo_flags'] = mo_flags
 
-            mo_params.update({
-                'output_dir': merge_converted_model_path(arguments.converted_models, mo_params.get('output_dir'))
-            })
+            if 'converted_models' in arguments and arguments.converted_models:
+                mo_params = launcher_entry.get('mo_params', {})
+                mo_params.update({
+                    'output_dir': merge_converted_model_path(arguments.converted_models, mo_params.get('output_dir'))
+                })
 
-            launcher_entry['mo_params'] = mo_params
+                launcher_entry['mo_params'] = mo_params
 
             if 'aocl' in arguments and arguments.aocl:
                 launcher_entry['_aocl'] = arguments.aocl
@@ -395,14 +419,27 @@ def merge_pipelines(config, arguments, update_launcher_entry):
                 for stage in pipeline['stages']:
                     if 'launcher' in stage:
                         merge_dlsdk_launcher_args(arguments, stage['launcher'], update_launcher_entry)
+
+        def merge_modules(config, arguments, update_launcher_entry):
+            for evaluation in config['evaluations']:
+                module_config = evaluation.get('module_config')
+                if not module_config:
+                    continue
+                if 'launchers' not in module_config:
+                    continue
+                for launcher in module_config['launchers']:
+                    merge_dlsdk_launcher_args(arguments, launcher, update_launcher_entry)
+
         functors_by_mode = {
             'models': merge_models,
-            'pipelines': merge_pipelines
+            'pipelines': merge_pipelines,
+            'evaluations': merge_modules
         }
 
         additional_keys = [
             'model_optimizer', 'tf_custom_op_config_dir',
             'tf_obj_detection_api_pipeline_config_path',
+            'transformations_config_dir',
             'cpu_extensions_mode', 'vpu_log_level'
         ]
         arguments_dict = arguments if isinstance(arguments, dict) else vars(arguments)
@@ -417,70 +454,140 @@ def merge_pipelines(config, arguments, update_launcher_entry):
 
     @staticmethod
     def _filter_launchers(config, arguments, mode='models'):
-        def filtered(launcher, targets):
-            target_tags = args.get('target_tags') or []
-            if target_tags:
-                if not contains_any(target_tags, launcher.get('tags', [])):
-                    return True
-
-            config_framework = launcher['framework'].lower()
-            target_framework = (args.get('target_framework') or config_framework).lower()
-            if config_framework != target_framework:
-                return True
+        functors_by_mode = {
+            'models': filter_models,
+            'pipelines': filter_pipelines,
+            'evaluations': filter_modules
+        }
 
-            return targets and launcher.get('device', '').lower() not in targets
+        args = arguments if isinstance(arguments, dict) else vars(arguments)
+        target_devices = to_lower_register(args.get('target_devices') or [])
+        filtering_mode = functors_by_mode[mode]
+        filtering_mode(config, target_devices, args)
 
-        def filter_models(config, target_devices):
-            models_after_filtration = []
-            for model in config['models']:
-                launchers_after_filtration = []
+    @staticmethod
+    def _separate_evaluations(config, mode='models'):
+        def _separate_models_evaluations(models_config):
+            evaluations = []
+            for model in models_config['models']:
                 launchers = model['launchers']
-                for launcher in launchers:
-                    if 'device' not in launcher and target_devices:
-                        for device in target_devices:
-                            launcher_with_device = copy.deepcopy(launcher)
-                            launcher_with_device['device'] = device
-                            if not filtered(launcher_with_device, target_devices):
-                                launchers_after_filtration.append(launcher_with_device)
-                    if not filtered(launcher, target_devices):
-                        launchers_after_filtration.append(launcher)
-
-                if not launchers_after_filtration:
-                    warnings.warn('Model "{}" has no launchers'.format(model['name']))
+                datasets = model['datasets']
+                if not launchers:
                     continue
+                if len(launchers) == 1 and len(datasets) == 1:
+                    evaluations.append(model)
+                    continue
+                for launcher in model['launchers']:
+                    model_evaluations = []
+                    model_config_copy_launcher = copy.deepcopy(model)
+                    model_config_copy_launcher['launchers'] = [launcher]
+
+                    for dataset in model_config_copy_launcher['datasets']:
+                        model_config_copy_dataset = copy.deepcopy(model_config_copy_launcher)
+                        model_config_copy_dataset['datasets'] = [dataset]
+                        model_evaluations.append(model_config_copy_dataset)
+
+                    evaluations.extend(model_evaluations)
+
+            models_config['models'] = evaluations
+
+        def _separate_modules_evaluations(modules_config):
+            evals = modules_config['evaluations']
+            eval_list = []
+            for evaluation in evals:
+                if 'module_config' not in evaluation:
+                    eval_list.append(evaluation)
+                    continue
+                module_config = evaluation['module_config']
+                launchers = module_config.get('launchers', [])
+                datasets = module_config.get('datasets', [])
+                eval_config_list = []
+                for launcher in launchers:
+                    copy_module_config = copy.deepcopy(module_config)
+                    copy_module_config['launchers'] = [launcher]
+                    if not datasets:
+                        eval_config_list.append(copy_module_config)
+                        continue
+                    for dataset in datasets:
+                        copy_evaluation_for_dataset = copy.deepcopy(copy_module_config)
+                        copy_evaluation_for_dataset['datasets'] = [dataset]
+                        eval_config_list.append(copy_evaluation_for_dataset)
+                for eval_config in eval_config_list:
+                    copy_evaluation = copy.deepcopy(evaluation)
+                    copy_evaluation['module_config'] = eval_config
+                    eval_list.append(copy_evaluation)
+
+            modules_config['evaluations'] = eval_list
+
+        mode_func = {
+            'models': _separate_models_evaluations,
+            'evaluations': _separate_modules_evaluations
+        }
 
-                model['launchers'] = launchers_after_filtration
-                models_after_filtration.append(model)
-
-            config['models'] = models_after_filtration
+        separator = mode_func.get(mode)
+        if not separator:
+            return
+        separator(config)
 
-        def filter_pipelines(config, target_devices):
-            saved_pipelines = []
-            for pipeline in config['pipelines']:
-                filtered_pipeline = False
-                for stage in pipeline['stages']:
-                    if 'launcher' in stage:
-                        if filtered(stage['launcher'], target_devices):
-                            filtered_pipeline = True
-                        break
-                if filtered_pipeline:
+    @staticmethod
+    def _previous_configuration_parameters_sharing(config, mode='models'):
+        def _share_params_models(models_config):
+            shared_params = {parameter: None for parameter in CONFIG_SHARED_PARAMETERS}
+            for model in models_config['models']:
+                launchers = model['launchers']
+                if not launchers:
                     continue
-                saved_pipelines.append(pipeline)
-            config['pipelines'] = saved_pipelines
-
-        functors_by_mode = {
-            'models': filter_models,
-            'pipelines': filter_pipelines
+                for launcher in model['launchers']:
+                    for parameter in CONFIG_SHARED_PARAMETERS:
+                        if parameter in launcher:
+                            if shared_params[parameter] is not None:
+                                launcher['_prev_{}'.format(parameter)] = shared_params[parameter]
+                            shared_params[parameter] = launcher[parameter]
+
+        def _share_params_modules(modules_config):
+            """Expose each shared parameter's previous launcher value as '_prev_<parameter>'."""
+            shared_params = {parameter: None for parameter in CONFIG_SHARED_PARAMETERS}
+            for evaluation in modules_config['evaluations']:
+                # module_config may be absent or carry no 'launchers' entry; both mean nothing to share.
+                launchers = (evaluation.get('module_config') or {}).get('launchers') or []
+                for launcher in launchers:
+                    for parameter in CONFIG_SHARED_PARAMETERS:
+                        if parameter in launcher:
+                            if shared_params[parameter] is not None:
+                                launcher['_prev_{}'.format(parameter)] = shared_params[parameter]
+                            shared_params[parameter] = launcher[parameter]
+
+        def _share_params_pipelines(pipelines_config):
+            shared_params = {parameter: None for parameter in CONFIG_SHARED_PARAMETERS}
+            for pipeline in pipelines_config['pipelines']:
+                for stage in pipeline['stages']:
+                    launcher = stage.get('launcher', {})
+                    for parameter in CONFIG_SHARED_PARAMETERS:
+                        if parameter in launcher:
+                            if shared_params[parameter] is not None:
+                                launcher['_prev_{}'.format(parameter)] = shared_params[parameter]
+                            shared_params[parameter] = launcher[parameter]
+        mode_func = {
+            'models': _share_params_models,
+            'evaluations': _share_params_modules,
+            'pipelines': _share_params_pipelines
         }
 
-        args = arguments if isinstance(arguments, dict) else vars(arguments)
-        target_devices = to_lower_register(args.get('target_devices') or [])
-        filtering_mode = functors_by_mode[mode]
-        filtering_mode(config, target_devices)
-
+        processor = mode_func.get(mode)
+        if not processor:
+            return
+        processor(config)
 
     @staticmethod
     def convert_paths(config):
+        definitions = os.environ.get(DEFINITION_ENV_VAR)
+        if definitions:
+            definitions = read_yaml(Path(definitions))
+            ConfigReader._prepare_global_configs(definitions)
+            config = ConfigReader._merge_configs(definitions, config, {}, 'models')
+        if COMMAND_LINE_ARGS_AS_ENV_VARS['source'] in os.environ:
+            ConfigReader._merge_paths_with_prefixes({}, config, 'models')
+
         def convert_launcher_paths(launcher_config):
             for key, path in launcher_config.items():
                 if key not in ENTRIES_PATHS['launchers']:
@@ -503,7 +610,7 @@ def convert_dataset_paths(dataset_config):
                 for preprocessor in dataset_config['preprocessing']:
                     path_preprocessing = (create_command_line_mapping(preprocessor, None))
                     for path in path_preprocessing:
-                        preprocessor[path] = Path(path_preprocessing[path])
+                        preprocessor[path] = Path(preprocessor[path])
 
             for key, path in dataset_config.items():
                 if key not in ENTRIES_PATHS['datasets']:
@@ -513,8 +620,10 @@ def convert_dataset_paths(dataset_config):
         for model in config['models']:
             for launcher_config in model['launchers']:
                 convert_launcher_paths(launcher_config)
-            for dataset_config in model['datasets']:
+            datasets = model['datasets'].values() if isinstance(model['datasets'], dict) else model['datasets']
+            for dataset_config in datasets:
                 convert_dataset_paths(dataset_config)
+        return config
 
 
 def create_command_line_mapping(config, value):
@@ -524,3 +633,163 @@ def create_command_line_mapping(config, value):
             mapping[key] = value
 
     return mapping
+
+
+def filtered(launcher, targets, args):
+    target_tags = args.get('target_tags') or []
+    if target_tags:
+        if not contains_any(target_tags, launcher.get('tags', [])):
+            return True
+
+    config_framework = launcher['framework'].lower()
+    target_framework = (args.get('target_framework') or config_framework).lower()
+    if config_framework != target_framework:
+        return True
+
+    return targets and launcher.get('device', '').lower() not in targets
+
+
+def filter_models(config, target_devices, args):
+    models_after_filtration = []
+    for model in config['models']:
+        launchers_after_filtration = []
+        launchers = model['launchers']
+        for launcher in launchers:
+            if 'device' not in launcher and target_devices:
+                for device in target_devices:
+                    launcher_with_device = copy.deepcopy(launcher)
+                    launcher_with_device['device'] = device
+                    if not filtered(launcher_with_device, target_devices, args):
+                        launchers_after_filtration.append(launcher_with_device)
+                continue
+            if not filtered(launcher, target_devices, args):
+                launchers_after_filtration.append(launcher)
+
+        if not launchers_after_filtration:
+            warnings.warn('Model "{}" has no launchers'.format(model['name']))
+            continue
+
+        model['launchers'] = launchers_after_filtration
+        models_after_filtration.append(model)
+
+    config['models'] = models_after_filtration
+
+
+def filter_pipelines(config, target_devices, args):
+    saved_pipelines = []
+    for pipeline in config['pipelines']:
+        filtered_pipeline = False
+        for stage in pipeline['stages']:
+            if 'launcher' in stage:
+                if filtered(stage['launcher'], target_devices, args):
+                    filtered_pipeline = True
+                break
+        if filtered_pipeline:
+            continue
+        saved_pipelines.append(pipeline)
+    config['pipelines'] = saved_pipelines
+
+
+def filter_modules(config, target_devices, args):
+    filtered_evals = []
+    for evaluation in config['evaluations']:
+        if 'module_config' not in evaluation or 'launchers' not in evaluation['module_config']:
+            if target_devices:
+                warnings.warn(
+                    'Information about launcher is not provided in config for {}. '
+                    'Filtration can not be done'.format(evaluation['name'])
+                )
+            filtered_evals.append(evaluation)
+            continue
+        module_config = evaluation['module_config']
+        launchers = module_config['launchers']
+        if target_devices:
+            launchers_without_device = [launcher for launcher in launchers if 'device' not in launcher]
+            for launcher in launchers_without_device:
+                for device in target_devices:
+                    launcher_with_device = copy.deepcopy(launcher)
+                    launcher_with_device['device'] = device
+                    launchers.append(launcher_with_device)
+        launchers = [
+            launcher for launcher in launchers if not filtered(launcher, target_devices, args)
+        ]
+        if not launchers:
+            warnings.warn('Model "{}" has no launchers'.format(evaluation['name']))
+        evaluation['module_config']['launchers'] = launchers
+        filtered_evals.append(evaluation)
+    config['evaluations'] = filtered_evals
+
+
+def process_config(
+        config_item, entries_paths, args, dataset_identifier='datasets',
+        launchers_idenitfier='launchers', identifers_mapping=None
+):
+    def process_dataset(datasets_configs):
+        if not isinstance(datasets_configs, list):
+            datasets_configs = [datasets_configs]
+        for datasets_config in datasets_configs:
+            annotation_conversion_config = datasets_config.get('annotation_conversion')
+            if annotation_conversion_config:
+                command_line_conversion = (create_command_line_mapping(annotation_conversion_config, 'source'))
+                merge_entry_paths(command_line_conversion, annotation_conversion_config, args)
+            if 'preprocessing' in datasets_config:
+                for preprocessor in datasets_config['preprocessing']:
+                    command_line_preprocessing = (create_command_line_mapping(preprocessor, 'models'))
+                    merge_entry_paths(command_line_preprocessing, preprocessor, args)
+
+    def process_launchers(launchers_configs):
+        if not isinstance(launchers_configs, list):
+            launchers_configs = [launchers_configs]
+
+        for launcher_config in launchers_configs:
+            adapter_config = launcher_config.get('adapter')
+            if not isinstance(adapter_config, dict):
+                continue
+            command_line_adapter = (create_command_line_mapping(adapter_config, 'models'))
+            merge_entry_paths(command_line_adapter, adapter_config, args)
+
+    for entry, command_line_arg in entries_paths.items():
+        entry_id = entry if not identifers_mapping else identifers_mapping[entry]
+        if entry_id not in config_item:
+            continue
+
+        if entry_id == dataset_identifier:
+            process_dataset(config_item[entry_id])
+
+        if entry_id == launchers_idenitfier:
+            launchers_configs = config_item[entry_id]
+            process_launchers(launchers_configs)
+
+        config_entires = config_item[entry_id]
+        if not isinstance(config_entires, list):
+            config_entires = [config_entires]
+        for config_entry in config_entires:
+            merge_entry_paths(command_line_arg, config_entry, args)
+
+
+def merge_entry_paths(keys, value, args):
+    """Resolve path fields of ``value`` in place.
+
+    ``keys`` maps a field name in ``value`` to the name of the ``args`` entry holding its prefix directory.
+    Absolute paths become Path objects; relative ones are joined to the prefix when one is supplied.
+    Raises ConfigError when a supplied prefix is not a directory.
+    """
+    for field, argument in keys.items():
+        if field not in value:
+            continue
+        config_path = Path(value[field])
+        if config_path.is_absolute():
+            value[field] = config_path
+        elif argument in args and args[argument]:  # without a prefix the relative value stays as configured
+            if not args[argument].is_dir():
+                raise ConfigError('argument: {} should be a directory'.format(argument))
+            value[field] = args[argument] / config_path
+
+
+def get_mode(config):
+    evaluation_keys = [key for key in config if key != 'global_definitions']
+    if not evaluation_keys:
+        raise ConfigError('Invalid config structure. No evaluations detected.')
+    if len(evaluation_keys) > 1:
+        raise ConfigError('Multiple evaluation types in the one config is not supported. '
+                          'Please separate on several configs.')
+    return next(iter(evaluation_keys))
diff --git a/tools/accuracy_checker/accuracy_checker/config/config_validator.py b/tools/accuracy_checker/accuracy_checker/config/config_validator.py
index dfd55065185..d72dab38957 100644
--- a/tools/accuracy_checker/accuracy_checker/config/config_validator.py
+++ b/tools/accuracy_checker/accuracy_checker/config/config_validator.py
@@ -52,14 +52,17 @@ def raise_error(self, value, field_uri, reason=None):
 
         raise ConfigError(error_message.format(value, field_uri))
 
+
 class _ExtraArgumentBehaviour(enum.Enum):
     WARN = 'warn'
     IGNORE = 'ignore'
     ERROR = 'error'
 
+
 def _is_dict_like(entry):
     return hasattr(entry, '__iter__') and hasattr(entry, '__getitem__')
 
+
 class ConfigValidator(BaseValidator):
     WARN_ON_EXTRA_ARGUMENT = _ExtraArgumentBehaviour.WARN
     ERROR_ON_EXTRA_ARGUMENT = _ExtraArgumentBehaviour.ERROR
@@ -170,8 +173,13 @@ def __init__(self, choices=None, regex=None, case_sensitive=False, allow_own_cho
         super().__init__(**kwargs)
         self.choices = choices if case_sensitive or not choices else list(map(str.lower, choices))
         self.allow_own_choice = allow_own_choice
-        self._regex = re.compile(regex, flags=re.IGNORECASE if not case_sensitive else 0) if regex else None
         self.case_sensitive = case_sensitive
+        self.set_regex(regex)
+
+    def set_regex(self, regex):
+        # A missing or empty pattern disables regex validation (self._regex is None).
+        flags = 0 if self.case_sensitive else re.IGNORECASE
+        self._regex = re.compile(regex, flags=flags) if regex else None
 
     def validate(self, entry, field_uri=None):
         super().validate(entry, field_uri)
@@ -266,7 +274,8 @@ def type(self):
 
 class InputField(BaseField):
     INPUTS_TYPES = ('CONST_INPUT', 'INPUT', 'IMAGE_INFO')
-    LAYOUT_TYPES = ['NCHW', 'NHWC', 'NCWH', 'NWHC']
+    LAYOUT_TYPES = ('NCHW', 'NHWC', 'NCWH', 'NWHC')
+    PRECISIONS = ('FP32', 'FP16', 'U8', 'U16', 'I8', 'I16', 'I32', 'I64')
 
     def __init__(self, **kwargs):
         super().__init__(**kwargs)
@@ -276,6 +285,7 @@ def __init__(self, **kwargs):
         self.layout = StringField(optional=True, choices=InputField.LAYOUT_TYPES,
                                   description="Layout: " + ', '.join(InputField.LAYOUT_TYPES))
         self.shape = BaseField(optional=True, description="Input shape.")
+        self.precision = StringField(optional=True, description='Input precision', choices=InputField.PRECISIONS)
 
     def validate(self, entry, field_uri=None):
         entry['optional'] = entry['type'] != 'CONST_INPUT'
diff --git a/tools/accuracy_checker/accuracy_checker/data_readers/README.md b/tools/accuracy_checker/accuracy_checker/data_readers/README.md
index 5b36b161ebf..8e02eec320e 100644
--- a/tools/accuracy_checker/accuracy_checker/data_readers/README.md
+++ b/tools/accuracy_checker/accuracy_checker/data_readers/README.md
@@ -30,10 +30,16 @@ reader:
 AccuracyChecker supports following list of data readers:
 * `opencv_imread` - read images using OpenCV library. Default color space is BGR.
 * `pillow_imread` - read images using Pillow library. Default color space is RGB.
-* `scipy_imread` - read images using Scipy library.
-* `tf_imred`- read images using Tensorflow. Default color space is RGB. Requires Tensorflow installation.
+* `scipy_imread` - read images using an approach similar to `scipy.misc.imread`.
+```
+Note: since version 1.3.0 the image processing module is no longer a part of the scipy library, so this reader does not use scipy anymore.
+```
+* `tf_imread` - read images using TensorFlow. Default color space is RGB. Requires TensorFlow installation.
 * `opencv_capture` - read frames from video using OpenCV.
 * `json_reader` - read value from json file.
   * `key` - key for reading from stored in json dictionary.
 * `annotation_features_extractor` - read features from annotation.
   * `features` - list of features. All features should be fields of annotation representation.
+* `numpy_reader` - read numpy dumped files.
+* `nifti_reader` - read data in NIfTI format.
+  * `channels_first` - read NIfTI files and transpose the data so that channels come first (Optional, default `False`).
diff --git a/tools/accuracy_checker/accuracy_checker/data_readers/__init__.py b/tools/accuracy_checker/accuracy_checker/data_readers/__init__.py
index dd9216749c2..b1f3669c58a 100644
--- a/tools/accuracy_checker/accuracy_checker/data_readers/__init__.py
+++ b/tools/accuracy_checker/accuracy_checker/data_readers/__init__.py
@@ -29,7 +29,9 @@
 
     DataRepresentation,
     ClipIdentifier,
-    create_reader
+    MultiFramesInputIdentifier,
+    create_reader,
+    REQUIRES_ANNOTATIONS
 )
 
 __all__ = [
@@ -48,5 +50,7 @@
 
     'DataRepresentation',
     'ClipIdentifier',
-    'create_reader'
+    'MultiFramesInputIdentifier',
+    'create_reader',
+    'REQUIRES_ANNOTATIONS'
 ]
diff --git a/tools/accuracy_checker/accuracy_checker/data_readers/data_reader.py b/tools/accuracy_checker/accuracy_checker/data_readers/data_reader.py
index f28bd2972b8..256baf2c261 100644
--- a/tools/accuracy_checker/accuracy_checker/data_readers/data_reader.py
+++ b/tools/accuracy_checker/accuracy_checker/data_readers/data_reader.py
@@ -19,14 +19,28 @@
 from collections import OrderedDict, namedtuple
 import re
 import cv2
-from PIL import Image
-import scipy.misc
 import numpy as np
-import nibabel as nib
+
+try:
+    import tensorflow as tf
+except ImportError as import_error:
+    tf = None
+
+try:
+    from PIL import Image
+except ImportError as import_error:
+    Image = None
+
+try:
+    import nibabel as nib
+except ImportError:
+    nib = None
 
 from ..utils import get_path, read_json, zipped_transform, set_image_metadata, contains_all
 from ..dependency import ClassProvider
-from ..config import BaseField, StringField, ConfigValidator, ConfigError, DictField, ListField
+from ..config import BaseField, StringField, ConfigValidator, ConfigError, DictField, ListField, BoolField
+
+REQUIRES_ANNOTATIONS = ['annotation_features_extractor', ]
 
 
 class DataRepresentation:
@@ -39,10 +53,11 @@ def __init__(self, data, meta=None, identifier=''):
         elif isinstance(data, list) and np.isscalar(data[0]):
             self.metadata['image_size'] = len(data)
         else:
-            self.metadata['image_size'] = data.shape if not isinstance(data, list) else data[0].shape
+            self.metadata['image_size'] = data.shape if not isinstance(data, list) else np.shape(data[0])
 
 
 ClipIdentifier = namedtuple('ClipIdentifier', ['video', 'clip_id', 'frames'])
+MultiFramesInputIdentifier = namedtuple('MultiFramesInputIdentifier', ['input_id', 'frames'])
 
 
 def create_reader(config):
@@ -80,6 +95,7 @@ def __init__(self, data_source, config=None, **kwargs):
         self.read_dispatcher = singledispatch(self.read)
         self.read_dispatcher.register(list, self._read_list)
         self.read_dispatcher.register(ClipIdentifier, self._read_clip)
+        self.read_dispatcher.register(MultiFramesInputIdentifier, self._read_frames_multi_input)
 
         self.validate_config()
         self.configure()
@@ -117,9 +133,19 @@ def _read_clip(self, data_id):
         frames_identifiers = [video / frame for frame in data_id.frames]
         return self.read_dispatcher(frames_identifiers)
 
+    def _read_frames_multi_input(self, data_id):
+        return self.read_dispatcher(data_id.frames)
+
     def read_item(self, data_id):
         return DataRepresentation(self.read_dispatcher(data_id), identifier=data_id)
 
+    @property
+    def name(self):
+        return self.__provider__
+
+    def reset(self):
+        pass
+
 
 class ReaderCombinerConfig(ConfigValidator):
     type = StringField()
@@ -168,6 +194,8 @@ class PillowImageReader(BaseReader):
 
     def __init__(self, data_source, config=None, **kwargs):
         super().__init__(data_source, config)
+        if Image is None:
+            raise ValueError('Pillow is not installed, please install it')
         self.convert_to_rgb = True
 
     def read(self, data_id):
@@ -180,8 +208,18 @@ def read(self, data_id):
 class ScipyImageReader(BaseReader):
     __provider__ = 'scipy_imread'
 
+    def __init__(self, data_source, config=None, **kwargs):
+        super().__init__(data_source, config)
+        if Image is None:
+            raise ValueError('Pillow is not installed, please install it')
+
     def read(self, data_id):
-        return np.array(scipy.misc.imread(str(get_path(self.data_source / data_id))))
+        # reimplementation scipy.misc.imread
+        image = Image.open(str(get_path(self.data_source / data_id)))
+        if image.mode == 'P':
+            image = image.convert('RGBA') if 'transparency' in image.info else image.convert('RGB')
+
+        return np.array(image)
 
 
 class OpenCVFrameReader(BaseReader):
@@ -214,6 +252,10 @@ def configure(self):
         self.data_source = get_path(self.data_source)
         self.videocap = cv2.VideoCapture(str(self.data_source))
 
+    def reset(self):
+        self.current = -1
+        self.videocap.set(cv2.CAP_PROP_POS_FRAMES, 0)
+
 
 class JSONReaderConfig(ConfigValidator):
     type = StringField()
@@ -254,15 +296,30 @@ def read(self, data_id):
         return float(data_id.split(":")[1])
 
 
+class NiftyReaderConfig(ConfigValidator):
+    type = StringField(optional=True)
+    channels_first = BoolField(optional=True, default=False)
+
+
 class NiftiImageReader(BaseReader):
     __provider__ = 'nifti_reader'
 
+    def validate_config(self):
+        if self.config:
+            config_validator = NiftyReaderConfig('nifti_reader_config')
+            config_validator.validate(self.config)
+
+    def configure(self):
+        if nib is None:
+            raise ImportError('nifty backend for image reading requires nibabel. Please install it before usage.')
+        self.channels_first = self.config.get('channels_first', False) if self.config else False
+
     def read(self, data_id):
         nib_image = nib.load(str(get_path(self.data_source / data_id)))
         image = np.array(nib_image.dataobj)
         if len(image.shape) != 4:  # Make sure 4D
             image = np.expand_dims(image, -1)
-        image = np.swapaxes(np.array(image), 0, -2)
+        image = np.transpose(image, (3, 0, 1, 2) if self.channels_first else (2, 1, 0, 3))
 
         return image
 
@@ -279,12 +336,8 @@ class TensorflowImageReader(BaseReader):
 
     def __init__(self, data_source, config=None, **kwargs):
         super().__init__(data_source, config)
-        try:
-            import tensorflow as tf
-        except ImportError as import_error:
-            raise ConfigError(
-                'tf_imread reader disabled.Please, install Tensorflow before using. \n{}'.format(import_error.msg)
-            )
+        if tf is None:
+            raise ImportError('tf backend for image reading requires TensorFlow. Please install it before usage.')
 
         tf.enable_eager_execution()
 
@@ -307,11 +360,6 @@ class AnnotationFeaturesConfig(ConfigValidator):
 class AnnotationFeaturesReader(BaseReader):
     __provider__ = 'annotation_features_extractor'
 
-    def __init__(self, data_source, config=None, annotations=None):
-        super().__init__(annotations, config)
-        self.counter = 0
-        self.data_source = annotations
-
     def configure(self):
         self.feature_list = self.config['features']
         if not contains_all(self.data_source[0].__dict__, self.feature_list):
@@ -319,9 +367,11 @@ def configure(self):
                 'annotation_class prototype does not contain provided features {}'.format(', '.join(self.feature_list))
             )
         self.single = len(self.feature_list) == 1
+        self.counter = 0
+        self.subset = range(len(self.data_source))
 
     def read(self, data_id):
-        relevant_annotation = self.data_source[self.counter]
+        relevant_annotation = self.data_source[self.subset[self.counter]]
         self.counter += 1
         features = [getattr(relevant_annotation, feature) for feature in self.feature_list]
         if self.single:
@@ -330,3 +380,7 @@ def read(self, data_id):
 
     def _read_list(self, data_id):
         return self.read(data_id)
+
+    def reset(self):
+        self.subset = range(len(self.data_source))
+        self.counter = 0
diff --git a/tools/accuracy_checker/accuracy_checker/dataset.py b/tools/accuracy_checker/accuracy_checker/dataset.py
index f5a76e06f4f..e924fda8101 100644
--- a/tools/accuracy_checker/accuracy_checker/dataset.py
+++ b/tools/accuracy_checker/accuracy_checker/dataset.py
@@ -20,9 +20,9 @@
 
 from .annotation_converters import BaseFormatConverter, save_annotation, make_subset, analyze_dataset
 from .config import ConfigValidator, StringField, PathField, ListField, DictField, BaseField, NumberField, ConfigError
-from .utils import JSONDecoderWithAutoConversion, read_json, get_path, contains_all, set_image_metadata
-from .representation import BaseRepresentation
-from .data_readers import DataReaderField
+from .utils import JSONDecoderWithAutoConversion, read_json, get_path, contains_all, set_image_metadata, OrderedSet
+from .representation import BaseRepresentation, ReIdentificationClassificationAnnotation, ReIdentificationAnnotation
+from .data_readers import DataReaderField, REQUIRES_ANNOTATIONS
 
 
 class DatasetConfig(ConfigValidator):
@@ -41,6 +41,7 @@ class DatasetConfig(ConfigValidator):
     subsample_size = BaseField(optional=True)
     subsample_seed = NumberField(value_type=int, min_value=0, optional=True)
     analyze_dataset = BaseField(optional=True)
+    segmentation_masks_source = PathField(is_directory=True, optional=True)
 
 
 class Dataset:
@@ -50,9 +51,31 @@ def __init__(self, config_entry):
         self.iteration = 0
         dataset_config = DatasetConfig('Dataset')
         dataset_config.validate(self._config)
+        self._images_dir = Path(self._config.get('data_source', ''))
+        self._load_annotation()
+
+    def _load_annotation(self):
+        def create_subset(subsample_size, subsample_seed):
+            if isinstance(subsample_size, str):
+                if subsample_size.endswith('%'):
+                    try:
+                        subsample_size = float(subsample_size[:-1])
+                    except ValueError:
+                        raise ConfigError('invalid value for subsample_size: {}'.format(subsample_size))
+                    if subsample_size <= 0:
+                        raise ConfigError('subsample_size should be > 0')
+                    subsample_size *= len(annotation) / 100
+                    subsample_size = int(subsample_size) or 1
+            try:
+                subsample_size = int(subsample_size)
+            except ValueError:
+                raise ConfigError('invalid value for subsample_size: {}'.format(subsample_size))
+            if subsample_size < 1:
+                raise ConfigError('subsample_size should be > 0')
+            return make_subset(annotation, subsample_size, subsample_seed)
+
         annotation, meta = None, None
         use_converted_annotation = True
-        self._images_dir = Path(self._config.get('data_source', ''))
         if 'annotation' in self._config:
             annotation_file = Path(self._config['annotation'])
             if annotation_file.exists():
@@ -66,13 +89,10 @@ def __init__(self, config_entry):
             raise ConfigError('path to converted annotation or data for conversion should be specified')
 
         subsample_size = self._config.get('subsample_size')
-        if subsample_size:
+        if subsample_size is not None:
             subsample_seed = self._config.get('subsample_seed', 666)
-            if isinstance(subsample_size, str):
-                if subsample_size.endswith('%'):
-                    subsample_size = float(subsample_size[:-1]) / 100 * len(annotation)
-            subsample_size = int(subsample_size)
-            annotation = make_subset(annotation, subsample_size, subsample_seed)
+
+            annotation = create_subset(subsample_size, subsample_seed)
 
         if self._config.get('analyze_dataset', False):
             analyze_dataset(annotation, meta)
@@ -85,7 +105,7 @@ def __init__(self, config_entry):
             save_annotation(annotation, meta, Path(annotation_name), meta_name)
 
         self._annotation = annotation
-        self._meta = meta
+        self._meta = meta or {}
         self.name = self._config.get('name')
         self.subset = None
 
@@ -98,7 +118,9 @@ def config(self):
         return deepcopy(self._config) #read-only
 
     def __len__(self):
-        return self.size
+        if self.subset:
+            return len(self.subset)
+        return len(self._annotation)
 
     @property
     def metadata(self):
@@ -110,15 +132,18 @@ def labels(self):
 
     @property
     def size(self):
-        if self.subset:
-            return len(self.subset)
+        return self.__len__()
+
+    @property
+    def full_size(self):
         return len(self._annotation)
 
     def __call__(self, context, *args, **kwargs):
-        batch_annotation = self.__getitem__(self.iteration)
+        batch_input_ids, batch_annotation = self.__getitem__(self.iteration)
         self.iteration += 1
         context.annotation_batch = batch_annotation
         context.identifiers_batch = [annotation.identifier for annotation in batch_annotation]
+        context.input_ids_batch = batch_input_ids
 
     def __getitem__(self, item):
         if self.size <= item * self.batch:
@@ -127,31 +152,67 @@ def __getitem__(self, item):
         batch_start = item * self.batch
         batch_end = min(self.size, batch_start + self.batch)
         if self.subset:
-            return [self._annotation[idx] for idx in self.subset[batch_start:batch_end]]
+            batch_ids = self.subset[batch_start:batch_end]
+            return batch_ids, [self._annotation[idx] for idx in batch_ids]
+        batch_ids = range(batch_start, batch_end)
 
-        return self._annotation[batch_start:batch_end]
+        return batch_ids, self._annotation[batch_start:batch_end]
 
-    def make_subset(self, ids=None, start=0, step=1, end=None):
+    def make_subset(self, ids=None, start=0, step=1, end=None, accept_pairs=False):
+        pairwise_subset = isinstance(
+            self._annotation[0], (ReIdentificationAnnotation, ReIdentificationClassificationAnnotation)
+        )
         if ids:
-            self.subset = ids
+            self.subset = ids if not pairwise_subset else self._make_subset_pairwise(ids, accept_pairs)
             return
         if not end:
             end = self.size
-        self.subset = range(start, end, step)
-
-    @staticmethod
-    def set_image_metadata(annotation, images):
-        image_sizes = []
-        data = images.data
-        if not isinstance(data, list):
-            data = [data]
-        for image in data:
-            image_sizes.append(image.shape)
-        annotation.set_image_size(image_sizes)
+        ids = range(start, end, step)
+        self.subset = ids if not pairwise_subset else self._make_subset_pairwise(ids, accept_pairs)
+
+    def _make_subset_pairwise(self, ids, add_pairs=False):
+        # Build an ordered index list from ids; with add_pairs the related pair indices are appended too.
+        subsample_set, pairs_set = OrderedSet(), OrderedSet()
+        if isinstance(self._annotation[0], ReIdentificationClassificationAnnotation):
+            identifier_to_index = {annotation.identifier: index for index, annotation in enumerate(self._annotation)}
+            for idx in ids:
+                subsample_set.add(idx)
+                current_annotation = self._annotation[idx]
+                positive_pairs = [
+                    identifier_to_index[pair_identifier] for pair_identifier in current_annotation.positive_pairs
+                ]
+                pairs_set |= positive_pairs
+                negative_pairs = [  # negative pairs must be read from negative_pairs, not positive_pairs
+                    identifier_to_index[pair_identifier] for pair_identifier in current_annotation.negative_pairs
+                ]
+                pairs_set |= negative_pairs
+        else:
+            for idx in ids:
+                subsample_set.add(idx)
+                selected_annotation = self._annotation[idx]
+                if not selected_annotation.query:
+                    query_for_person = [
+                        idx for idx, annotation in enumerate(self._annotation)
+                        if annotation.person_id == selected_annotation.person_id and annotation.query
+                    ]
+                    pairs_set |= OrderedSet(query_for_person)
+                else:
+                    gallery_for_person = [
+                        idx for idx, annotation in enumerate(self._annotation)
+                        if annotation.person_id == selected_annotation.person_id and not annotation.query
+                    ]
+                    pairs_set |= OrderedSet(gallery_for_person)
+
+        if add_pairs:
+            subsample_set |= pairs_set
+
+        return list(subsample_set)
 
     def set_annotation_metadata(self, annotation, image, data_source):
-        self.set_image_metadata(annotation, image.data)
+        set_image_metadata(annotation, image)
         annotation.set_data_source(data_source)
+        segmentation_mask_source = self.config.get('segmentation_masks_source')
+        annotation.metadata['segmentation_masks_source'] = segmentation_mask_source
 
     def _load_meta(self):
         meta_data_file = self._config.get('dataset_meta')
@@ -170,6 +231,11 @@ def _convert_annotation(self):
 
         return annotation, meta
 
+    def reset(self, reload_annotation=False):
+        self.subset = None
+        if reload_annotation:
+            self._load_annotation()
+
 
 def read_annotation(annotation_file: Path):
     annotation_file = get_path(annotation_file)
@@ -186,7 +252,8 @@ def read_annotation(annotation_file: Path):
 
 
 class DatasetWrapper:
-    def __init__(self, data_reader, annotation_reader=None):
+    def __init__(self, data_reader, annotation_reader=None, tag=''):
+        self.tag = tag
         self.data_reader = data_reader
         self.annotation_reader = annotation_reader
         self._batch = 1
@@ -199,32 +266,41 @@ def __getitem__(self, item):
             raise IndexError
         batch_annotation = []
         if self.annotation_reader:
-            batch_annotation = self.annotation_reader[item]
+            batch_annotation_ids, batch_annotation = self.annotation_reader[item]
             batch_identifiers = [annotation.identifier for annotation in batch_annotation]
             batch_input = [self.data_reader(identifier=identifier) for identifier in batch_identifiers]
             for annotation, input_data in zip(batch_annotation, batch_input):
                 set_image_metadata(annotation, input_data)
                 annotation.metadata['data_source'] = self.data_reader.data_source
-            return batch_annotation, batch_input, batch_identifiers
+                segmentation_mask_source = self.annotation_reader.config.get('segmentation_masks_source')
+                annotation.metadata['segmentation_masks_source'] = segmentation_mask_source
+            return batch_annotation_ids, batch_annotation, batch_input, batch_identifiers
         batch_start = item * self.batch
         batch_end = min(self.size, batch_start + self.batch)
-        if self.subset:
-            batch_identifiers = [self._identifiers[idx] for idx in self.subset[batch_start:batch_end]]
-        else:
-            batch_identifiers = self._identifiers[batch_start:batch_end]
+        batch_input_ids = self.subset[batch_start:batch_end] if self.subset else range(batch_start, batch_end)
+        batch_identifiers = [self._identifiers[idx] for idx in batch_input_ids]
         batch_input = [self.data_reader(identifier=identifier) for identifier in batch_identifiers]
 
-        return batch_annotation, batch_input, batch_identifiers
+        return batch_input_ids, batch_annotation, batch_input, batch_identifiers
 
-    def make_subset(self, ids=None, start=0, step=1, end=None):
+    def __len__(self):
         if self.annotation_reader:
-            self.annotation_reader.make_subset(ids, start, step, end)
+            return self.annotation_reader.size
+        if self.subset:
+            return len(self.subset)
+        return len(self._identifiers)
+
+    def make_subset(self, ids=None, start=0, step=1, end=None, accept_pairs=False):
+        if self.annotation_reader:
+            self.annotation_reader.make_subset(ids, start, step, end, accept_pairs)
         if ids:
             self.subset = ids
             return
         if not end:
             end = self.size
         self.subset = range(start, end, step)
+        if self.data_reader.name in REQUIRES_ANNOTATIONS:
+            self.data_reader.subset = self.subset
 
     @property
     def batch(self):
@@ -236,16 +312,19 @@ def batch(self, batch):
             self.annotation_reader.batch = batch
         self._batch = batch
 
-    def reset(self):
+    def reset(self, reload_annotation=False):
         if self.subset:
             self.subset = None
         if self.annotation_reader:
-            self.annotation_reader.subset = None
+            self.annotation_reader.reset(reload_annotation)
+        self.data_reader.reset()
 
     @property
-    def size(self):
+    def full_size(self):
         if self.annotation_reader:
-            return self.annotation_reader.size
-        if self.subset:
-            return len(self.subset)
+            return self.annotation_reader.full_size
         return len(self._identifiers)
+
+    @property
+    def size(self):
+        return self.__len__()
diff --git a/tools/accuracy_checker/accuracy_checker/evaluators/__init__.py b/tools/accuracy_checker/accuracy_checker/evaluators/__init__.py
index 765549ea638..30843c3baea 100644
--- a/tools/accuracy_checker/accuracy_checker/evaluators/__init__.py
+++ b/tools/accuracy_checker/accuracy_checker/evaluators/__init__.py
@@ -15,10 +15,15 @@
 """
 
 from .model_evaluator import ModelEvaluator
-from .pipeline_evaluator import PipeLineEvaluator, get_processing_info
+from .pipeline_evaluator import PipeLineEvaluator
+from .module_evaluator import ModuleEvaluator
+from .base_evaluator import BaseEvaluator
+
 
 __all__ = [
     'ModelEvaluator',
     'PipeLineEvaluator',
-    'get_processing_info'
+    'ModuleEvaluator',
+
+    'BaseEvaluator'
 ]
diff --git a/tools/accuracy_checker/accuracy_checker/evaluators/base_evaluator.py b/tools/accuracy_checker/accuracy_checker/evaluators/base_evaluator.py
new file mode 100644
index 00000000000..ee91743fbef
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/evaluators/base_evaluator.py
@@ -0,0 +1,52 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+
+# Base class for custom evaluators; methods that raise NotImplementedError must be overridden.
+class BaseEvaluator:
+    # Alternate constructor from a config; this default ignores `config` and calls cls() without arguments.
+    @classmethod
+    def from_configs(cls, config):
+        return cls()
+
+    # Extract evaluation info from config as a 5-tuple; this default returns config['name'] plus placeholders.
+    @staticmethod
+    def get_processing_info(config):
+        return config['name'], 'framework', 'device', None, 'dataset_name'
+
+    # Define the dataset processing cycle (not implemented in the base class).
+    def process_dataset(self, *args, **kwargs):
+        raise NotImplementedError
+
+    # Finalize and get metrics results (not implemented in the base class).
+    def compute_metrics(self, print_results=True, ignore_results_formatting=False):
+        raise NotImplementedError
+
+    # Delayed logging of metrics results (not implemented in the base class).
+    def print_metrics_results(self, ignore_results_formatting=False):
+        raise NotImplementedError
+
+    # Extract metrics results values prepared for printing (not implemented in the base class).
+    def extract_metrics_results(self, print_results=True, ignore_results_formatting=False):
+        raise NotImplementedError
+
+    # Release entities which can not be deleted automatically; the default implementation does nothing.
+    def release(self):
+        pass
+
+    # Reset progress of metrics calculation (not implemented in the base class).
+    def reset(self):
+        raise NotImplementedError
diff --git a/tools/accuracy_checker/accuracy_checker/evaluators/model_evaluator.py b/tools/accuracy_checker/accuracy_checker/evaluators/model_evaluator.py
index 91951b4d950..2ea0573d02f 100644
--- a/tools/accuracy_checker/accuracy_checker/evaluators/model_evaluator.py
+++ b/tools/accuracy_checker/accuracy_checker/evaluators/model_evaluator.py
@@ -18,20 +18,21 @@
 import copy
 import pickle
 
-from ..utils import get_path, set_image_metadata, extract_image_representations
+from ..utils import get_path, extract_image_representations
 from ..dataset import Dataset
 from ..launcher import create_launcher, DummyLauncher, InputFeeder
 from ..launcher.loaders import PickleLoader
-from ..logging import print_info
+from ..logging import print_info, warning
 from ..metrics import MetricsExecutor
 from ..postprocessor import PostprocessingExecutor
 from ..preprocessor import PreprocessingExecutor
 from ..adapters import create_adapter
 from ..config import ConfigError
-from ..data_readers import BaseReader
+from ..data_readers import BaseReader, REQUIRES_ANNOTATIONS
+from .base_evaluator import BaseEvaluator
 
 
-class ModelEvaluator:
+class ModelEvaluator(BaseEvaluator):
     def __init__(
             self, launcher, input_feeder, adapter, reader, preprocessor, postprocessor, dataset, metric, async_mode
     ):
@@ -50,21 +51,24 @@ def __init__(
         self._metrics_results = []
 
     @classmethod
-    def from_configs(cls, launcher_config, dataset_config):
+    def from_configs(cls, model_config):
+        launcher_config = model_config['launchers'][0]
+        dataset_config = model_config['datasets'][0]
         dataset_name = dataset_config['name']
         data_reader_config = dataset_config.get('reader', 'opencv_imread')
         data_source = dataset_config.get('data_source')
+
         dataset = Dataset(dataset_config)
         if isinstance(data_reader_config, str):
-            data_reader = BaseReader.provide(data_reader_config, data_source, annotations=dataset.annotation)
+            data_reader_type = data_reader_config
+            data_reader_config = None
         elif isinstance(data_reader_config, dict):
-            data_reader = BaseReader.provide(
-                data_reader_config['type'], data_source, data_reader_config, annotations=dataset.annotation
-            )
+            data_reader_type = data_reader_config['type']
         else:
             raise ConfigError('reader should be dict or string')
-
-        dataset = Dataset(dataset_config)
+        if data_reader_type in REQUIRES_ANNOTATIONS:
+            data_source = dataset.annotation
+        data_reader = BaseReader.provide(data_reader_type, data_source, data_reader_config)
         launcher = create_launcher(launcher_config)
         async_mode = launcher.async_mode if hasattr(launcher, 'async_mode') else False
         config_adapter = launcher_config.get('adapter')
@@ -83,12 +87,22 @@ def from_configs(cls, launcher_config, dataset_config):
             preprocessor, postprocessor, dataset, metric_dispatcher, async_mode
         )
 
+    @staticmethod
+    def get_processing_info(config):
+        """Return (model name, framework, device, launcher tags, dataset name) for the first launcher/dataset."""
+        launcher, dataset = config['launchers'][0], config['datasets'][0]
+        model_name = config['name']
+        framework, device = launcher['framework'], launcher['device']
+        tags = launcher.get('tags')
+        dataset_name = dataset['name']
+
+        return model_name, framework, device, tags, dataset_name
+
     def _get_batch_input(self, batch_annotation):
         batch_identifiers = [annotation.identifier for annotation in batch_annotation]
         batch_input = [self.reader(identifier=identifier) for identifier in batch_identifiers]
         for annotation, input_data in zip(batch_annotation, batch_input):
-            set_image_metadata(annotation, input_data)
-            annotation.metadata['data_source'] = self.reader.data_source
+            self.dataset.set_annotation_metadata(annotation, input_data, self.reader.data_source)
         batch_input = self.preprocessor.process(batch_input, batch_annotation)
         _, batch_meta = extract_image_representations(batch_input)
         filled_inputs = self.input_feeder.fill_inputs(batch_input)
@@ -99,17 +113,21 @@ def process_dataset_async(self, stored_predictions, progress_reporter, *args, **
         def _process_ready_predictions(batch_predictions, batch_identifiers, batch_meta, adapter, raw_outputs_callback):
             if raw_outputs_callback:
                 raw_outputs_callback(
-                    [batch_predictions], network=self.launcher.network, exec_network=self.launcher.exec_network
+                    batch_predictions, network=self.launcher.network, exec_network=self.launcher.exec_network
                 )
             if adapter:
                 batch_predictions = self.adapter.process(batch_predictions, batch_identifiers, batch_meta)
 
             return batch_predictions
 
+        self.dataset.batch = self.launcher.batch
+        if self.launcher.allow_reshape_input or self.preprocessor.has_multi_infer_transformations:
+            warning('Model can not to be processed in async mode. Switched to sync.')
+            return self.process_dataset(stored_predictions, progress_reporter, *args, **kwargs)
+
         if self._is_stored(stored_predictions) or isinstance(self.launcher, DummyLauncher):
             self._annotations, self._predictions = self._load_stored_predictions(stored_predictions, progress_reporter)
 
-        self.dataset.batch = self.launcher.batch
         predictions_to_store = []
         dataset_iterator = iter(enumerate(self.dataset))
         free_irs = self.launcher.infer_requests
@@ -123,21 +141,23 @@ def _process_ready_predictions(batch_predictions, batch_identifiers, batch_meta,
             ready_irs, queued_irs = self._wait_for_any(queued_irs)
             if ready_irs:
                 wait_time = 0.01
-                for batch_id, batch_annotation, batch_meta, batch_predictions, ir in ready_irs:
+                while ready_irs:
+                    ready_data = ready_irs.pop(0)
+                    batch_id, batch_input_ids, batch_annotation, batch_meta, batch_raw_predictions, ir = ready_data
                     batch_identifiers = [annotation.identifier for annotation in batch_annotation]
                     batch_predictions = _process_ready_predictions(
-                        batch_predictions, batch_identifiers, batch_meta, self.adapter, kwargs.get('output_callback')
+                        batch_raw_predictions, batch_identifiers, batch_meta, self.adapter,
+                        kwargs.get('raw_outputs_callback')
                     )
                     free_irs.append(ir)
                     if stored_predictions:
                         predictions_to_store.extend(copy.deepcopy(batch_predictions))
                     annotations, predictions = self.postprocessor.process_batch(batch_annotation, batch_predictions)
+                    self.metric_executor.update_metrics_on_batch(batch_input_ids, annotations, predictions)
 
-                    if not self.postprocessor.has_dataset_processors:
-                        self.metric_executor.update_metrics_on_batch(annotations, predictions)
-
-                    self._annotations.extend(annotations)
-                    self._predictions.extend(predictions)
+                    if self.metric_executor.need_store_predictions:
+                        self._annotations.extend(annotations)
+                        self._predictions.extend(predictions)
 
                     if progress_reporter:
                         progress_reporter.update(batch_id, len(batch_predictions))
@@ -152,24 +172,28 @@ def _process_ready_predictions(batch_predictions, batch_identifiers, batch_meta,
         if stored_predictions:
             self.store_predictions(stored_predictions, predictions_to_store)
 
-        if self.postprocessor.has_dataset_processors:
-            self.metric_executor.update_metrics_on_batch(self._annotations, self._predictions)
-
-        return self.postprocessor.process_dataset(self._annotations, self._predictions)
-
     def process_dataset(self, stored_predictions, progress_reporter, *args, **kwargs):
+        if progress_reporter:
+            progress_reporter.reset(self.dataset.size)
         if self._is_stored(stored_predictions) or isinstance(self.launcher, DummyLauncher):
             self._annotations, self._predictions = self.load(stored_predictions, progress_reporter)
             self._annotations, self._predictions = self.postprocessor.full_process(self._annotations, self._predictions)
 
-            self.metric_executor.update_metrics_on_batch(self._annotations, self._predictions)
+            self.metric_executor.update_metrics_on_batch(
+                range(len(self._annotations)), self._annotations, self._predictions
+            )
             return self._annotations, self._predictions
 
         self.dataset.batch = self.launcher.batch
+        raw_outputs_callback = kwargs.get('output_callback')
         predictions_to_store = []
-        for batch_id, batch_annotation in enumerate(self.dataset):
+        for batch_id, (batch_input_ids, batch_annotation) in enumerate(self.dataset):
             filled_inputs, batch_meta, batch_identifiers = self._get_batch_input(batch_annotation)
             batch_predictions = self.launcher.predict(filled_inputs, batch_meta, **kwargs)
+            if raw_outputs_callback:
+                raw_outputs_callback(
+                    batch_predictions, network=self.launcher.network, exec_network=self.launcher.exec_network
+                )
             if self.adapter:
                 self.adapter.output_blob = self.adapter.output_blob or self.launcher.output_blob
                 batch_predictions = self.adapter.process(batch_predictions, batch_identifiers, batch_meta)
@@ -179,10 +203,11 @@ def process_dataset(self, stored_predictions, progress_reporter, *args, **kwargs
 
             annotations, predictions = self.postprocessor.process_batch(batch_annotation, batch_predictions, batch_meta)
             if not self.postprocessor.has_dataset_processors:
-                self.metric_executor.update_metrics_on_batch(annotations, predictions)
+                self.metric_executor.update_metrics_on_batch(batch_input_ids, annotations, predictions)
 
-            self._annotations.extend(annotations)
-            self._predictions.extend(predictions)
+            if self.metric_executor.need_store_predictions:
+                self._annotations.extend(annotations)
+                self._predictions.extend(predictions)
 
             if progress_reporter:
                 progress_reporter.update(batch_id, len(batch_predictions))
@@ -194,7 +219,9 @@ def process_dataset(self, stored_predictions, progress_reporter, *args, **kwargs
             self.store_predictions(stored_predictions, predictions_to_store)
 
         if self.postprocessor.has_dataset_processors:
-            self.metric_executor.update_metrics_on_batch(self._annotations, self._predictions)
+            self.metric_executor.update_metrics_on_batch(
+                range(len(self._annotations)), self._annotations, self._predictions
+            )
 
         return self.postprocessor.process_dataset(self._annotations, self._predictions)
 
@@ -212,7 +239,9 @@ def _is_stored(stored_predictions=None):
     def _load_stored_predictions(self, stored_predictions, progress_reporter):
         self._annotations, self._predictions = self.load(stored_predictions, progress_reporter)
         self._annotations, self._predictions = self.postprocessor.full_process(self._annotations, self._predictions)
-        self.metric_executor.update_metrics_on_batch(self._annotations, self._predictions)
+        self.metric_executor.update_metrics_on_batch(
+            range(len(self._annotations)), self._annotations, self._predictions
+        )
 
         return self._annotations, self._predictions
 
@@ -221,29 +250,32 @@ def _wait_for_any(irs):
         if not irs:
             return [], []
 
-        result = []
         free_indexes = []
-        for ir_id, (batch_id, batch_annotation, batch_meta, ir) in enumerate(irs):
+        for ir_id, (_, _, _, _, ir) in enumerate(irs):
             if ir.wait(0) == 0:
-                result.append((batch_id, batch_annotation, batch_meta, [ir.outputs], ir))
                 free_indexes.append(ir_id)
-        irs = [ir for ir_id, ir in enumerate(irs) if ir_id not in free_indexes]
+        result = []
+        free_indexes.sort(reverse=True)
+        for idx in free_indexes:
+            batch_id, batch_input_ids, batch_annotation, batch_meta, ir = irs.pop(idx)
+            result.append((batch_id, batch_input_ids, batch_annotation, batch_meta, ir.outputs, ir))
+
         return result, irs
 
     def _fill_free_irs(self, free_irs, queued_irs, dataset_iterator):
         for ir in free_irs:
             try:
-                batch_id, batch_annotation = next(dataset_iterator)
+                batch_id, (batch_input_ids, batch_annotation) = next(dataset_iterator)
             except StopIteration:
                 break
 
             batch_input, batch_meta, _ = self._get_batch_input(batch_annotation)
             self.launcher.predict_async(ir, batch_input, batch_meta)
-            queued_irs.append((batch_id, batch_annotation, batch_meta, ir))
+            queued_irs.append((batch_id, batch_input_ids, batch_annotation, batch_meta, ir))
 
         return free_irs, queued_irs
 
-    def compute_metrics(self, print_results=True, output_callback=None, ignore_results_formatting=False):
+    def compute_metrics(self, print_results=True, ignore_results_formatting=False):
         if self._metrics_results:
             del self._metrics_results
             self._metrics_results = []
@@ -252,16 +284,35 @@ def compute_metrics(self, print_results=True, output_callback=None, ignore_resul
                 self._annotations, self._predictions):
             self._metrics_results.append(evaluated_metric)
             if print_results:
-                result_presenter.write_result(evaluated_metric, output_callback, ignore_results_formatting)
+                result_presenter.write_result(evaluated_metric, ignore_results_formatting)
         return self._metrics_results
 
-    def print_metrics_results(self, output_callback=None, ignore_results_formatting=False):
+    def extract_metrics_results(self, print_results=True, ignore_results_formatting=False):
         if not self._metrics_results:
-            self.compute_metrics(True, output_callback, ignore_results_formatting)
+            self.compute_metrics(False, ignore_results_formatting)
+
+        result_presenters = self.metric_executor.get_metric_presenters()
+        extracted_results, extracted_meta = [], []
+        for presenter, metric_result in zip(result_presenters, self._metrics_results):
+            result, metadata = presenter.extract_result(metric_result)
+            if isinstance(result, list):
+                extracted_results.extend(result)
+                extracted_meta.extend(metadata)
+            else:
+                extracted_results.append(result)
+                extracted_meta.append(metadata)
+            if print_results:
+                presenter.write_result(metric_result, ignore_results_formatting)
+
+        return extracted_results, extracted_meta
+
+    def print_metrics_results(self, ignore_results_formatting=False):
+        if not self._metrics_results:
+            self.compute_metrics(True, ignore_results_formatting)
             return
         result_presenters = self.metric_executor.get_metric_presenters()
         for presenter, metric_result in zip(result_presenters, self._metrics_results):
-            presenter.write_results(metric_result, output_callback, ignore_results_formatting)
+            presenter.write_result(metric_result, ignore_results_formatting)
 
     def load(self, stored_predictions, progress_reporter):
         self._annotations = self.dataset.annotation
@@ -294,6 +345,9 @@ def store_predictions(stored_predictions, predictions):
             pickle.dump(predictions, content)
             print_info("prediction objects are save to {}".format(stored_predictions))
 
+    def reset_progress(self, progress_reporter):
+        progress_reporter.reset(self.dataset.size)  # hand the current dataset size to the reporter's reset
+
     def reset(self):
         self.metric_executor.reset()
         del self._annotations
@@ -302,6 +356,8 @@ def reset(self):
         self._annotations = []
         self._predictions = []
         self._metrics_results = []
+        self.dataset.reset(self.postprocessor.has_processors)
+        self.reader.reset()
 
     def release(self):
         self.launcher.release()
diff --git a/tools/accuracy_checker/accuracy_checker/evaluators/module_evaluator.py b/tools/accuracy_checker/accuracy_checker/evaluators/module_evaluator.py
new file mode 100644
index 00000000000..7913344369a
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/evaluators/module_evaluator.py
@@ -0,0 +1,75 @@
+from contextlib import contextmanager
+import sys
+import importlib
+
+from .base_evaluator import BaseEvaluator
+
+
+class ModuleEvaluator(BaseEvaluator):
+    """Evaluator that forwards every call to an externally loaded evaluation module."""
+
+    def __init__(self, internal_module):
+        super().__init__()
+        self._internal_module = internal_module
+
+    @classmethod
+    def from_configs(cls, config):
+        """Load the class named by config['module'] and wrap the object its from_configs returns."""
+        module = config['module']
+        module_config = config.get('module_config')
+        python_path = config.get('python_path')
+
+        return cls(load_module(module, python_path).from_configs(module_config))
+
+    def process_dataset(self, stored_predictions, progress_reporter, *args, **kwargs):
+        self._internal_module.process_dataset(stored_predictions, progress_reporter, *args, **kwargs)
+
+    def compute_metrics(self, print_results=True, ignore_results_formatting=False):
+        return self._internal_module.compute_metrics(print_results, ignore_results_formatting)
+
+    def print_metrics_results(self, ignore_results_formatting=False):
+        # NOTE(review): forwards to `print_metrics`, not `print_metrics_results` - confirm the module contract.
+        self._internal_module.print_metrics(ignore_results_formatting)
+
+    def extract_metrics_results(self, print_results=True, ignore_results_formatting=False):
+        return self._internal_module.extract_metrics_results(print_results, ignore_results_formatting)
+
+    def release(self):
+        self._internal_module.release()
+        del self._internal_module
+
+    def reset(self):
+        self._internal_module.reset()
+
+    @staticmethod
+    def get_processing_info(config):
+        """Ask the class named by config['module'] for its processing info."""
+        module = config['module']
+        python_path = config.get('python_path')
+        return load_module(module, python_path).get_processing_info(config)
+
+
+def load_module(model_cls, python_path=None):
+    """Import and return the attribute named by the dotted path `model_cls`.
+
+    `python_path`, when given, is appended to sys.path while the import runs.
+    """
+    module_parts = model_cls.split(".")
+    model_cls = module_parts[-1]
+    model_path = ".".join(module_parts[:-1])
+    with append_to_path(python_path):
+        return getattr(importlib.import_module(model_path), model_cls)
+
+
+@contextmanager
+def append_to_path(path):
+    """Temporarily append `path` (when truthy) to sys.path for the duration of the with-block."""
+    if path:
+        sys.path.append(path)
+    try:
+        yield
+    finally:
+        # Undo the append even when the with-body raises (e.g. a failed import);
+        # otherwise the entry would stay in sys.path for the rest of the process.
+        if path:
+            sys.path.remove(path)
diff --git a/tools/accuracy_checker/accuracy_checker/evaluators/pipeline_evaluator.py b/tools/accuracy_checker/accuracy_checker/evaluators/pipeline_evaluator.py
index 4357ac65b16..e8f11dbfc3e 100644
--- a/tools/accuracy_checker/accuracy_checker/evaluators/pipeline_evaluator.py
+++ b/tools/accuracy_checker/accuracy_checker/evaluators/pipeline_evaluator.py
@@ -26,7 +26,8 @@
 from ..metrics import MetricsExecutor
 from ..pipeline_connectors import StageConnectionDescription, Connection
 from ..postprocessor import PostprocessingExecutor
-from..preprocessor import PreprocessingExecutor
+from ..preprocessor import PreprocessingExecutor
+from .base_evaluator import BaseEvaluator
 
 
 def get_processing_info(pipeline_config):
@@ -145,6 +146,7 @@ def __init__(self, dataset, metric_executor=None, launcher=None):
         self.predictions = []
         self.annotation_batch = []
         self.prediction_batch = []
+        self.input_ids_batch = []
         self.data_batch = []
         self.metrics_results = []
         self.identifiers_batch = []
@@ -161,7 +163,8 @@ def shared_context(self):
             'annotation_batch': self.annotation_batch,
             'prediction_batch': self.prediction_batch,
             'data_batch': self.data_batch,
-            'identifiers_batch': self.identifiers_batch
+            'identifiers_batch': self.identifiers_batch,
+            'input_ids_batch': self.input_ids_batch
         }
         return _shared_context
 
@@ -177,21 +180,39 @@ def reset(self):
             self.metrics_executor.reset()
 
 
-class PipeLineEvaluator:
+class PipeLineEvaluator(BaseEvaluator):
     def __init__(self, stages):
         self.stages = stages
         self.create_connectors()
         self.context = next(iter(stages.values())).evaluation_context
+        self._metrics_results = []
+        self._metrics_result_presenters = []
 
     @classmethod
     def from_configs(cls, pipeline_config):
         stages = OrderedDict()
-        for stage_config in pipeline_config:
+        for stage_config in pipeline_config['stages']:
             stage_name = stage_config['stage']
             evaluation_stage = PipeLineStage.from_configs(stage_name, stage_config)
             stages[stage_name] = evaluation_stage
         return cls(stages)
 
+    @staticmethod
+    def get_processing_info(config):
+        """Return (name, framework, device, tags, dataset name) describing a pipeline config.
+
+        The dataset name is read from the first stage; framework, device and tags come
+        from the first stage that has a 'launcher' entry, and are None if no stage has one.
+        """
+        pipeline_name, stage_configs = config['name'], config['stages']
+        first_dataset_name = stage_configs[0]['dataset']['name']
+        first_launcher = next((stage['launcher'] for stage in stage_configs if 'launcher' in stage), {})
+
+        return (
+            pipeline_name, first_launcher.get('framework'), first_launcher.get('device'),
+            first_launcher.get('tags'), first_dataset_name
+        )
+
     def create_connectors(self):
         def make_connection(stages, connection_template):
             return Connection(stages, connection_template)
@@ -224,18 +245,55 @@ def process_dataset(self, stored_predictions, progress_reporter, *args, **kwargs
         if progress_reporter:
             progress_reporter.finish()
 
-    def compute_metrics(self, output_callback=None, ignore_results_formatting=False):
+    def compute_metrics(self, print_results=True, ignore_results_formatting=False):
         def eval_metrics(metrics_executor, annotations, predictions):
             for result_presenter, evaluated_metric in metrics_executor.iterate_metrics(annotations, predictions):
-                result_presenter.write_result(evaluated_metric, output_callback, ignore_results_formatting)
+                self._metrics_results.append(evaluated_metric)
+                self._metrics_result_presenters.append(result_presenter)
+                if print_results:
+                    result_presenter.write_result(evaluated_metric, ignore_results_formatting)
+
+        if self._metrics_results:
+            del self._metrics_results
+            self._metrics_results = []
+            self._metrics_result_presenters = []
 
         for _, stage in self.stages.items():
             metrics_executors = stage.evaluation_context.metrics_executor
             for metrics_executor in metrics_executors:
                 eval_context = stage.evaluation_context
                 eval_metrics(metrics_executor, eval_context.annotations, eval_context.predictions)
+        return self._metrics_results
+
+    def print_metrics_results(self, ignore_results_formatting=False):
+        if not self._metrics_results:
+            self.compute_metrics(False, ignore_results_formatting)  # compute silently; the loop below prints once
+        for presenter, metric_result in zip(self._metrics_result_presenters, self._metrics_results):
+            presenter.write_result(metric_result, ignore_results_formatting)
+
+    def extract_metrics_results(self, print_results=True, ignore_results_formatting=False):
+        """Return flat (results, metadata) lists extracted from the metric results via their presenters.
+
+        Metrics are computed first (without printing) when no results are stored yet.
+        """
+        if not self._metrics_results:
+            self.compute_metrics(False, ignore_results_formatting)
+
+        all_results, all_meta = [], []
+        for presenter, metric_result in zip(self._metrics_result_presenters, self._metrics_results):
+            result, metadata = presenter.extract_result(metric_result)
+            is_multi = isinstance(result, list)
+            all_results.extend(result if is_multi else [result])
+            all_meta.extend(metadata if is_multi else [metadata])
+            if print_results:
+                presenter.write_result(metric_result, ignore_results_formatting)
+        return all_results, all_meta
 
     def release(self):
         for _, stage in self.stages.items():
             for launcher in stage.evaluation_context.launcher:
                 launcher.release()
+
+    def reset(self):
+        for stage in self.stages.values():  # reset the evaluation context attached to each stage
+            stage.evaluation_context.reset()
diff --git a/tools/accuracy_checker/accuracy_checker/evaluators/quantization_model_evaluator.py b/tools/accuracy_checker/accuracy_checker/evaluators/quantization_model_evaluator.py
index d869b3987d6..3e435f8dbf2 100644
--- a/tools/accuracy_checker/accuracy_checker/evaluators/quantization_model_evaluator.py
+++ b/tools/accuracy_checker/accuracy_checker/evaluators/quantization_model_evaluator.py
@@ -16,72 +16,50 @@
 
 import time
 import copy
+import numpy as np
 
 from ..utils import extract_image_representations, contains_any
 from ..dataset import Dataset, DatasetWrapper
 from ..launcher import create_launcher, InputFeeder
+from ..logging import warning
 from ..metrics import MetricsExecutor
 from ..postprocessor import PostprocessingExecutor
 from ..preprocessor import PreprocessingExecutor
 from ..adapters import create_adapter
 from ..config import ConfigError
-from ..data_readers import BaseReader
-from ..statistics_collector import StatisticsCollector
+from ..data_readers import BaseReader, REQUIRES_ANNOTATIONS
 from ..progress_reporters import ProgressReporter
 
 
 class ModelEvaluator:
     def __init__(
-            self, launcher, input_feeder, adapter, dataset, preprocessor, postprocessor, metric
+            self, launcher, adapter, dataset_config
     ):
         self.launcher = launcher
-        self.input_feeder = input_feeder
+        self.input_feeder = None
         self.adapter = adapter
-        self.dataset = dataset
-        self.preprocessor = preprocessor
-        self.postprocessor = postprocessor
-        self.metric_executor = metric
-        self.stat_collector = None
+        self.dataset_config = dataset_config
+        self.preprocessor = None
+        self.dataset = None
+        self.postprocessor = None
+        self.metric_executor = None
 
         self._annotations = []
         self._predictions = []
+        self._input_ids = []
         self._metrics_results = []
 
     @classmethod
     def from_configs(cls, config):
         model_config = config['models'][0]
-        dataset_config = model_config['datasets'][0]
+        dataset_config = model_config['datasets']
         launcher_config = model_config['launchers'][0]
-        dataset_name = dataset_config['name']
-        data_reader_config = dataset_config.get('reader', 'opencv_imread')
-        data_source = dataset_config.get('data_source')
-
-        if isinstance(data_reader_config, str):
-            data_reader = BaseReader.provide(data_reader_config, data_source)
-        elif isinstance(data_reader_config, dict):
-            data_reader = BaseReader.provide(data_reader_config['type'], data_source, data_reader_config)
-        else:
-            raise ConfigError('reader should be dict or string')
-        annotation_reader = None
-        dataset_meta = {}
-        metric_dispatcher = None
-        if contains_any(dataset_config, ['annotation', 'annotation_conversion']):
-            annotation_reader = Dataset(dataset_config)
-            dataset_meta = annotation_reader.metadata
-        dataset = DatasetWrapper(data_reader, annotation_reader)
         launcher = create_launcher(launcher_config, delayed_model_loading=True)
         config_adapter = launcher_config.get('adapter')
-        adapter = None if not config_adapter else create_adapter(config_adapter, None, annotation_reader)
-        preprocessor = PreprocessingExecutor(
-            dataset_config.get('preprocessing'), dataset_name, dataset_meta
-        )
-        postprocessor = PostprocessingExecutor(dataset_config.get('postprocessing'), dataset_name, dataset_meta)
-        if 'metrics' in dataset_config:
-            metric_dispatcher = MetricsExecutor(dataset_config.get('metrics', []), annotation_reader)
+        adapter = None if not config_adapter else create_adapter(config_adapter, None, None)
 
         return cls(
-            launcher, None, adapter, dataset,
-            preprocessor, postprocessor, metric_dispatcher
+            launcher, adapter, dataset_config
         )
 
     def _get_batch_input(self, batch_input, batch_annotation):
@@ -93,44 +71,55 @@ def _get_batch_input(self, batch_input, batch_annotation):
 
     def process_dataset_async(
             self,
-            nreq=2,
-            statistics_functors_maping=None,
+            nreq=None,
             subset=None,
             num_images=None,
             check_progress=False,
+            dataset_tag='',
+            output_callback=None,
+            allow_pairwise_subset=False,
             **kwargs
     ):
-        def _process_ready_predictions(batch_predictions, batch_identifiers, batch_meta, adapter, raw_outputs_callback):
-            if self.stat_collector:
-                self.stat_collector.process_batch(batch_predictions)
-            if raw_outputs_callback:
-                raw_outputs_callback(batch_predictions)
+
+        def _process_ready_predictions(batch_raw_predictions, batch_identifiers, batch_meta, adapter):
             if adapter:
-                batch_predictions = self.adapter.process(batch_predictions, batch_identifiers, batch_meta)
+                return self.adapter.process(batch_raw_predictions, batch_identifiers, batch_meta)
 
-            return batch_predictions
+            return batch_raw_predictions
 
         def _create_subset(subset, num_images):
             if subset is not None:
-                self.dataset.make_subset(ids=subset)
+                self.dataset.make_subset(ids=subset, accept_pairs=allow_pairwise_subset)
             elif num_images is not None:
-                self.dataset.make_subset(end=num_images)
+                self.dataset.make_subset(end=num_images, accept_pairs=allow_pairwise_subset)
+
+        def _set_number_infer_requests(nreq):
+            if nreq is None:
+                nreq = self.launcher.auto_num_requests()
+            if self.launcher.num_requests != nreq:
+                self.launcher.num_requests = nreq
+
+        if self.dataset is None or (dataset_tag and self.dataset.tag != dataset_tag):
+            self.select_dataset(dataset_tag)
+
+        if self.launcher.allow_reshape_input or self.preprocessor.has_multi_infer_transformations:
+            warning('Model can not to be processed in async mode. Switched to sync.')
+            return self.process_dataset(
+                subset, num_images, check_progress, dataset_tag, output_callback, allow_pairwise_subset, **kwargs
+            )
+        _set_number_infer_requests(nreq)
 
         self.dataset.batch = self.launcher.batch
-        self.stat_collector = None
+        self.preprocessor.input_shapes = self.launcher.inputs_info_for_meta()
         progress_reporter = None
 
         _create_subset(subset, num_images)
 
         if check_progress:
-            progress_reporter = ProgressReporter.provide('print', self.dataset.size)
+            progress_reporter = self._create_progress_reporter(check_progress, self.dataset.size)
 
         dataset_iterator = iter(enumerate(self.dataset))
-        if self.launcher.num_requests != nreq:
-            self.launcher.num_requests = nreq
 
-        if statistics_functors_maping:
-            self.stat_collector = StatisticsCollector(statistics_functors_maping, self.launcher.batch)
         free_irs = self.launcher.infer_requests
         queued_irs = []
         wait_time = 0.01
@@ -142,18 +131,41 @@ def _create_subset(subset, num_images):
             ready_irs, queued_irs = self._wait_for_any(queued_irs)
             if ready_irs:
                 wait_time = 0.01
-                for batch_id, batch_annotation, batch_identifiers, batch_meta, batch_predictions, ir in ready_irs:
+                while ready_irs:
+                    ready_data = ready_irs.pop(0)
+                    (
+                        batch_id,
+                        batch_input_ids,
+                        batch_annotation,
+                        batch_identifiers,
+                        batch_meta,
+                        batch_raw_predictions,
+                        ir
+                    ) = ready_data
                     batch_predictions = _process_ready_predictions(
-                        batch_predictions, batch_identifiers, batch_meta, self.adapter, kwargs.get('output_callback')
+                        batch_raw_predictions, batch_identifiers, batch_meta, self.adapter
                     )
                     free_irs.append(ir)
-                    annotations, predictions = self.postprocessor.process_batch(batch_annotation, batch_predictions)
+                    annotations, predictions = self.postprocessor.process_batch(
+                        batch_annotation, batch_predictions, batch_meta
+                    )
 
-                    if not self.postprocessor.has_dataset_processors and self.metric_executor:
-                        self.metric_executor.update_metrics_on_batch(annotations, predictions)
-
-                    self._annotations.extend(annotations)
-                    self._predictions.extend(predictions)
+                    metrics_result = None
+                    if self.metric_executor:
+                        metrics_result = self.metric_executor.update_metrics_on_batch(
+                            batch_input_ids, annotations, predictions
+                        )
+                        if self.metric_executor.need_store_predictions:
+                            self._annotations.extend(annotations)
+                            self._predictions.extend(predictions)
+
+                    if output_callback:
+                        output_callback(
+                            batch_raw_predictions,
+                            metrics_result=metrics_result,
+                            element_identifiers=batch_identifiers,
+                            dataset_indices=batch_input_ids
+                        )
 
                     if progress_reporter:
                         progress_reporter.update(batch_id, len(batch_predictions))
@@ -161,97 +173,127 @@ def _create_subset(subset, num_images):
                 time.sleep(wait_time)
                 wait_time = max(wait_time * 2, .16)
 
-        if self.postprocessor.has_dataset_processors:
-            self.metric_executor.update_metrics_on_batch(self._annotations, self._predictions)
-
         if progress_reporter:
             progress_reporter.finish()
 
-        return self.postprocessor.process_dataset(self._annotations, self._predictions)
+    def select_dataset(self, dataset_tag):
+        if self.dataset is not None and isinstance(self.dataset_config, list):
+            return
+        dataset_attributes = create_dataset_attributes(self.dataset_config, dataset_tag)
+        self.dataset, self.metric_executor, self.preprocessor, self.postprocessor = dataset_attributes
+        if self.dataset.annotation_reader and self.dataset.annotation_reader.metadata:
+            self.adapter.label_map = self.dataset.annotation_reader.metadata.get('label_map')
 
     def process_dataset(
             self,
-            statistics_functors_maping=None,
             subset=None,
             num_images=None,
             check_progress=False,
+            dataset_tag='',
+            output_callback=None,
+            allow_pairwise_subset=False,
             **kwargs
     ):
+        def _create_subset(subset, num_images):
+            if subset is not None:
+                self.dataset.make_subset(ids=subset, accept_pairs=allow_pairwise_subset)
+            elif num_images is not None:
+                self.dataset.make_subset(end=num_images, accept_pairs=allow_pairwise_subset)
+
+        if self.dataset is None or (dataset_tag and self.dataset.tag != dataset_tag):
+            self.select_dataset(dataset_tag)
         self.dataset.batch = self.launcher.batch
+        self.preprocessor.input_shapes = self.launcher.inputs_info_for_meta()
         progress_reporter = None
 
-        if statistics_functors_maping:
-            self.stat_collector = StatisticsCollector(statistics_functors_maping, self.launcher.batch)
-
-        if subset is not None:
-            self.dataset.make_subset(ids=subset)
-
-        elif num_images is not None:
-            self.dataset.make_subset(end=num_images)
+        _create_subset(subset, num_images)
 
         if check_progress:
-            progress_reporter = ProgressReporter.provide('print', self.dataset.size)
+            progress_reporter = self._create_progress_reporter(check_progress, self.dataset.size)
 
-        for batch_id, (batch_annotation, batch_inputs, batch_identifiers) in enumerate(self.dataset):
+        for batch_id, (batch_input_ids, batch_annotation, batch_inputs, batch_identifiers) in enumerate(self.dataset):
             filled_inputs, batch_meta = self._get_batch_input(batch_inputs, batch_annotation)
-            batch_predictions = self.launcher.predict(filled_inputs, batch_meta, **kwargs)
-            if self.stat_collector:
-                self.stat_collector.process_batch(batch_predictions)
+            batch_raw_predictions = self.launcher.predict(filled_inputs, batch_meta, **kwargs)
             if self.adapter:
                 self.adapter.output_blob = self.adapter.output_blob or self.launcher.output_blob
-                batch_predictions = self.adapter.process(batch_predictions, batch_identifiers, batch_meta)
+                batch_predictions = self.adapter.process(batch_raw_predictions, batch_identifiers, batch_meta)
+            else:
+                batch_predictions = batch_raw_predictions
 
             annotations, predictions = self.postprocessor.process_batch(batch_annotation, batch_predictions, batch_meta)
-            if not self.postprocessor.has_dataset_processors and self.metric_executor:
-                self.metric_executor.update_metrics_on_batch(annotations, predictions)
+            metrics_result = None
+            if self.metric_executor:
+                metrics_result = self.metric_executor.update_metrics_on_batch(batch_input_ids, annotations, predictions)
+                if self.metric_executor.need_store_predictions:
+                    self._annotations.extend(annotations)
+                    self._predictions.extend(predictions)
 
-            self._annotations.extend(annotations)
-            self._predictions.extend(predictions)
+            if output_callback:
+                if isinstance(batch_raw_predictions, list) and len(batch_raw_predictions) == 1:
+                    batch_raw_predictions = batch_raw_predictions[0]
+                output_callback(
+                    batch_raw_predictions,
+                    metrics_result=metrics_result,
+                    element_identifiers=batch_identifiers,
+                    dataset_indices=batch_input_ids
+                )
 
             if progress_reporter:
                 progress_reporter.update(batch_id, len(batch_predictions))
 
-        if self.postprocessor.has_dataset_processors and self.metric_executor:
-            self.metric_executor.update_metrics_on_batch(self._annotations, self._predictions)
-
         if progress_reporter:
             progress_reporter.finish()
 
-        return self.postprocessor.process_dataset(self._annotations, self._predictions)
-
     @staticmethod
     def _wait_for_any(irs):
         if not irs:
             return [], []
 
-        result = []
         free_indexes = []
-        for ir_id, (batch_id, batch_annotation, batch_identifiers, batch_meta, ir) in enumerate(irs):
+        for ir_id, (_, _, _, _, _, ir) in enumerate(irs):
             if ir.wait(0) == 0:
-                result.append((batch_id, batch_annotation, batch_identifiers, batch_meta, ir.outputs, ir))
                 free_indexes.append(ir_id)
-        irs = [ir for ir_id, ir in enumerate(irs) if ir_id not in free_indexes]
+        result = []
+        free_indexes.sort(reverse=True)
+        for idx in free_indexes:
+            batch_id, batch_input_ids, batch_annotation, batch_identifiers, batch_meta, ir = irs.pop(idx)
+            result.append((batch_id, batch_input_ids, batch_annotation, batch_identifiers, batch_meta, ir.outputs, ir))
+
         return result, irs
 
     def _fill_free_irs(self, free_irs, queued_irs, dataset_iterator, **kwargs):
         for ir in free_irs:
             try:
-                batch_id, (batch_annotation, batch_inputs, batch_identifiers) = next(dataset_iterator)
+                batch_id, (batch_input_ids, batch_annotation, batch_inputs, batch_identifiers) = next(dataset_iterator)
             except StopIteration:
                 break
 
             batch_input, batch_meta = self._get_batch_input(batch_inputs, batch_annotation)
             self.launcher.predict_async(ir, batch_input, batch_meta, **kwargs)
-            queued_irs.append((batch_id, batch_annotation, batch_identifiers, batch_meta, ir))
+            queued_irs.append((batch_id, batch_input_ids, batch_annotation, batch_identifiers, batch_meta, ir))
 
         return free_irs, queued_irs
 
+    @staticmethod
+    def _create_progress_reporter(check_progress, dataset_size):
+        pr_kwargs = {}
+        if isinstance(check_progress, int) and not isinstance(check_progress, bool):
+            pr_kwargs = {"print_interval": check_progress}
+
+        return ProgressReporter.provide('print', dataset_size, **pr_kwargs)
+
     def compute_metrics(self, print_results=True, ignore_results_formatting=False):
         if not self.metric_executor:
             return []
         if self._metrics_results:
             del self._metrics_results
             self._metrics_results = []
+        if self._input_ids:
+            indexes = np.argsort(self._input_ids)
+            annotations = [self._annotations[idx] for idx in indexes]
+            predictions = [self._predictions[idx] for idx in indexes]
+            self._annotations = annotations
+            self._predictions = predictions
 
         for result_presenter, evaluated_metric in self.metric_executor.iterate_metrics(
                 self._annotations, self._predictions):
@@ -266,7 +308,26 @@ def print_metrics_results(self, ignore_results_formatting=False):
             return
         result_presenters = self.metric_executor.get_metric_presenters()
         for presenter, metric_result in zip(result_presenters, self._metrics_results):
-            presenter.write_results(metric_result, ignore_results_formatting)
+            presenter.write_result(metric_result, ignore_results_formatting)
+
+    def extract_metrics_results(self, print_results=True, ignore_results_formatting=False):
+        if not self._metrics_results:
+            self.compute_metrics(False, ignore_results_formatting)
+
+        result_presenters = self.metric_executor.get_metric_presenters()
+        extracted_results, extracted_meta = [], []
+        for presenter, metric_result in zip(result_presenters, self._metrics_results):
+            result, metadata = presenter.extract_result(metric_result)
+            if isinstance(result, list):
+                extracted_results.extend(result)
+                extracted_meta.extend(metadata)
+            else:
+                extracted_results.append(result)
+                extracted_meta.append(metadata)
+            if print_results:
+                presenter.write_result(metric_result, ignore_results_formatting)
+
+        return extracted_results, extracted_meta
 
     @property
     def metrics_results(self):
@@ -296,21 +357,83 @@ def load_network_from_ir(self, xml_path, bin_path):
     def get_network(self):
         return self.launcher.network
 
-    def get_statistics(self):
-        if not self.stat_collector:
-            return None
-        return self.stat_collector.get_statistics()
+    def get_metrics_attributes(self):
+        if not self.metric_executor:
+            return {}
+        return self.metric_executor.get_metrics_attributes()
+
+    def register_metric(self, metric_config):
+        if isinstance(metric_config, str):
+            self.metric_executor.register_metric({'type': metric_config})
+        elif isinstance(metric_config, dict):
+            self.metric_executor.register_metric(metric_config)
+        else:
+            raise ValueError('Unsupported metric configuration type {}'.format(type(metric_config)))
+
+    def register_postprocessor(self, postprocessing_config):
+        if isinstance(postprocessing_config, str):
+            self.postprocessor.register_postprocessor({'type': postprocessing_config})
+        elif isinstance(postprocessing_config, dict):
+            self.postprocessor.register_postprocessor(postprocessing_config)
+        else:
+            raise ValueError('Unsupported post-processor configuration type {}'.format(type(postprocessing_config)))
 
     def reset(self):
         if self.metric_executor:
             self.metric_executor.reset()
         del self._annotations
         del self._predictions
+        del self._input_ids
         del self._metrics_results
         self._annotations = []
         self._predictions = []
+        self._input_ids = []
         self._metrics_results = []
-        self.dataset.reset()
+        if self.dataset:
+            self.dataset.reset(self.postprocessor.has_processors)
 
     def release(self):
         self.launcher.release()
+
+
+def create_dataset_attributes(config, tag):
+    if isinstance(config, list):
+        dataset_config = config[0]
+    elif isinstance(config, dict):
+        dataset_config = config.get(tag)
+        if not dataset_config:
+            raise ConfigError('suitable dataset for *{}* not found'.format(tag))
+    else:
+        raise TypeError('unknown type for config, dictionary or list must be')
+
+    dataset_name = dataset_config['name']
+    data_reader_config = dataset_config.get('reader', 'opencv_imread')
+    data_source = dataset_config.get('data_source')
+    annotation_reader = None
+    dataset_meta = {}
+    if contains_any(dataset_config, ['annotation', 'annotation_conversion']):
+        annotation_reader = Dataset(dataset_config)
+        dataset_meta = annotation_reader.metadata
+    if isinstance(data_reader_config, str):
+        data_reader_type = data_reader_config
+        data_reader_config = None
+    elif isinstance(data_reader_config, dict):
+        data_reader_type = data_reader_config['type']
+    else:
+        raise ConfigError('reader should be dict or string')
+    if data_reader_type in REQUIRES_ANNOTATIONS:
+        if annotation_reader is None:
+            raise ConfigError('data reader *{}* requires annotation'.format(data_reader_type))
+        data_source = annotation_reader.annotation
+    data_reader = BaseReader.provide(data_reader_type, data_source, data_reader_config)
+
+    metric_dispatcher = None
+    dataset = DatasetWrapper(data_reader, annotation_reader)
+    preprocessor = PreprocessingExecutor(
+        dataset_config.get('preprocessing'), dataset_name, dataset_meta
+    )
+    postprocessor = PostprocessingExecutor(dataset_config.get('postprocessing'), dataset_name, dataset_meta)
+    if 'metrics' in dataset_config:
+        metric_dispatcher = MetricsExecutor(dataset_config.get('metrics', []), annotation_reader)
+
+    return dataset, metric_dispatcher, preprocessor, postprocessor
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/__init__.py b/tools/accuracy_checker/accuracy_checker/launcher/__init__.py
index c7c87e30c8f..47c9d02f6e0 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/__init__.py
+++ b/tools/accuracy_checker/accuracy_checker/launcher/__init__.py
@@ -29,7 +29,7 @@
     from .mxnet_launcher import MxNetLauncher
 except ImportError as import_error:
     MxNetLauncher = unsupported_launcher(
-        'mxnet', "MxNet isn't installed. Please, install it before using.\n{}".format(import_error.msg)
+        'mxnet', "MXNet isn't installed. Please, install it before using.\n{}".format(import_error.msg)
     )
 
 try:
@@ -62,6 +62,8 @@
         'onnx_runtime', "ONNX Runtime isn't installed. Please, install it before using. \n{}".format(import_error.msg)
     )
 
+from .pytorch_launcher import PyTorchLauncher
+
 __all__ = [
     'create_launcher',
     'Launcher',
@@ -72,6 +74,7 @@
     'DLSDKLauncher',
     'OpenCVLauncher',
     'ONNXLauncher',
+    'PyTorchLauncher',
     'DummyLauncher',
     'InputFeeder'
 ]
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/caffe_launcher.py b/tools/accuracy_checker/accuracy_checker/launcher/caffe_launcher.py
index 6c5c681fa1d..7f6a81b3c03 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/caffe_launcher.py
+++ b/tools/accuracy_checker/accuracy_checker/launcher/caffe_launcher.py
@@ -35,13 +35,17 @@ class CaffeLauncher(Launcher):
     def __init__(self, config_entry: dict, *args, **kwargs):
         super().__init__(config_entry, *args, **kwargs)
 
-        caffe_launcher_config = LauncherConfigValidator('Caffe_Launcher', fields=self.parameters())
+        self._delayed_model_loading = kwargs.get('delayed_model_loading', False)
+        caffe_launcher_config = LauncherConfigValidator(
+            'Caffe_Launcher', fields=self.parameters(), delayed_model_loading=self._delayed_model_loading
+        )
         caffe_launcher_config.validate(self.config)
+        self._do_reshape = False
 
-        self.model = str(self.get_value_from_config('model'))
-        self.weights = str(self.get_value_from_config('weights'))
-
-        self.network = caffe.Net(self.model, self.weights, caffe.TEST)
+        if not self._delayed_model_loading:
+            self.model = str(self.get_value_from_config('model'))
+            self.weights = str(self.get_value_from_config('weights'))
+            self.network = caffe.Net(self.model, self.weights, caffe.TEST)
         self.allow_reshape_input = self.get_value_from_config('allow_reshape_input')
 
         match = re.match(DEVICE_REGEX, self.get_value_from_config('device').lower())
@@ -88,16 +92,20 @@ def batch(self):
     def output_blob(self):
         return next(iter(self.network.outputs))
 
-    def fit_to_input(self, data, layer_name, layout):
+    def fit_to_input(self, data, layer_name, layout, precision):
         data_shape = np.shape(data)
-        data = np.transpose(data, layout) if len(data_shape) == 4 else np.array(data)
         layer_shape = self.inputs[layer_name]
+        if len(data_shape) == 5 and len(layer_shape) == 4:
+            data = data[0]
+            data_shape = np.shape(data)
+        data = np.transpose(data, layout) if len(data_shape) == 4 else np.array(data)
+        data_shape = np.shape(data)
         if layer_shape != data_shape:
-            self.network.blobs[layer_name].reshape(*data.shape)
+            self._do_reshape = True
 
-        return data
+        return data.astype(precision) if precision else data  # no precision requested: keep data unchanged
 
-    def predict(self, inputs, metadata, *args, **kwargs):
+    def predict(self, inputs, metadata=None, **kwargs):
         """
         Args:
             inputs: dictionary where keys are input layers names and values are data for them.
@@ -107,7 +115,13 @@ def predict(self, inputs, metadata, *args, **kwargs):
         """
         results = []
         for infer_input in inputs:
+            if self._do_reshape:
+                for layer_name, data in infer_input.items():
+                    if data.shape != self.inputs[layer_name]:
+                        self.network.blobs[layer_name].reshape(*data.shape)
+
             results.append(self.network.forward(**infer_input))
+        if metadata is not None:
             for image_meta in metadata:
                 image_meta['input_shape'] = self.inputs_info_for_meta()
 
@@ -116,6 +130,10 @@ def predict(self, inputs, metadata, *args, **kwargs):
     def predict_async(self, *args, **kwargs):
         raise ValueError('Caffe Launcher does not support async mode')
 
+    @staticmethod
+    def create_network(model, weights):
+        return caffe.Net(str(model), str(weights), caffe.TEST)
+
     def release(self):
         """
         Releases launcher.
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/caffe_launcher_readme.md b/tools/accuracy_checker/accuracy_checker/launcher/caffe_launcher_readme.md
index 79f6c2ce76a..be2451ebce7 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/caffe_launcher_readme.md
+++ b/tools/accuracy_checker/accuracy_checker/launcher/caffe_launcher_readme.md
@@ -5,7 +5,7 @@ For enabling Caffe launcher you need to add `framework: caffe` in launchers sect
 * `device` - specifies which device will be used for infer (`cpu`, `gpu_0` and so on).
 * `model` - path to prototxt file with Caffe model for your topology.
 * `weights` - path to caffemodel file with weights for your topology.
-* `adapter` - approach how raw output will be converted to representation of dataset problem, some adapters can be specific to framework. You can find detailed instruction how to use adapters [here](../adapters/README.md]).
+* `adapter` - approach how raw output will be converted to representation of dataset problem, some adapters can be specific to framework. You can find detailed instruction how to use adapters [here](../adapters/README.md).
 
 You also can specify batch size for your model using `batch` and allow to reshape input layer to data shape, using specific parameter: `allow_reshape_input` (default value is False).
 
@@ -18,7 +18,8 @@ Each input description should has following info:
     * `CONST_INPUT` - input will be filled using constant provided in config. It also requires to provide `value`.
     * `IMAGE_INFO` - specific key for setting information about input shape to layer (used in Faster RCNN based topologies). You do not need provide `value`, because it will be calculated in runtime. Format value is `Nx[H, W, S]`, where `N` is batch size, `H` - original image height, `W` - original image width, `S` - scale of original image (default 1).
     * `INPUT` - network input for main data stream (e. g. images). If you have several data inputs, you should provide regular expression for identifier as `value` for specifying which one data should be provided in specific input.
-    Optionally you can determine `shape` of input (actually does not used, Caffe launcher uses info given from network) and `layout` in case when your model was trained with non-standard data layout (For Caffe default layout is `NCHW`).
+    Optionally you can determine `shape` of input (not actually used, Caffe launcher uses info given from network), `layout` in case when your model was trained with non-standard data layout (For Caffe default layout is `NCHW`)
+    and `precision` (Supported precisions: `FP32` - float, `FP16` - signed short, `U8` - unsigned char, `U16` - unsigned short int, `I8` - signed char, `I16` - short int, `I32` - int, `I64` - long int).
 
 Caffe launcher config example:
 
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/dlsdk_launcher.py b/tools/accuracy_checker/accuracy_checker/launcher/dlsdk_launcher.py
index 1e49a006918..f3f1aab18c6 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/dlsdk_launcher.py
+++ b/tools/accuracy_checker/accuracy_checker/launcher/dlsdk_launcher.py
@@ -15,12 +15,12 @@
 """
 
 import subprocess
+import multiprocessing
 from pathlib import Path
 import os
 import platform
 import re
 import numpy as np
-from cpuinfo import get_cpu_info
 import openvino.inference_engine as ie
 
 from ..config import ConfigError, NumberField, PathField, StringField, DictField, ListField, BoolField, BaseField
@@ -38,18 +38,24 @@
 from .model_conversion import convert_model, FrameworkParameters
 from ..logging import print_info
 
+try:
+    from cpuinfo import get_cpu_info
+except ImportError:
+    get_cpu_info = None
+
 
 HETERO_KEYWORD = 'HETERO:'
 MULTI_DEVICE_KEYWORD = 'MULTI:'
 FPGA_COMPILER_MODE_VAR = 'CL_CONTEXT_COMPILER_MODE_INTELFPGA'
 NIREQ_REGEX = r"(\(\d+\))"
+MYRIAD_WITH_DEVICE_ID = r"MYRIAD\.*.*"
 HETERO_MODE_REGEX = r"(?:^{hetero}(?P<devices>(?:{devices})(?:,(?:{devices}))*)$)".format(
-    hetero=HETERO_KEYWORD, devices="|".join(ie.known_plugins)
+    hetero=HETERO_KEYWORD, devices="|".join(ie.known_plugins + [MYRIAD_WITH_DEVICE_ID])
 )
 MULTI_DEVICE_MODE_REGEX = r"(?:^{multi}(?P<devices_ireq>(?:{devices_ireq})(?:,(?:{devices_ireq}))*)$)".format(
-    multi=MULTI_DEVICE_KEYWORD, devices_ireq="{}?|".format(NIREQ_REGEX).join(ie.known_plugins)
+    multi=MULTI_DEVICE_KEYWORD, devices_ireq="{}?|".format(NIREQ_REGEX).join(ie.known_plugins + [MYRIAD_WITH_DEVICE_ID])
 )
-DEVICE_REGEX = r"(?:^(?P<device>{devices})$)".format(devices="|".join(ie.known_plugins))
+DEVICE_REGEX = r"(?:^(?P<device>{devices})$)".format(devices="|".join(ie.known_plugins + [MYRIAD_WITH_DEVICE_ID]))
 SUPPORTED_DEVICE_REGEX = r"{multi}|{hetero}|{regular}".format(
     multi=MULTI_DEVICE_MODE_REGEX, hetero=HETERO_MODE_REGEX, regular=DEVICE_REGEX
 )
@@ -93,7 +99,6 @@ def __init__(self, config_uri, **kwargs):
     def validate(self, entry, field_uri=None):
         """
         Validate that launcher entry meets all configuration structure requirements.
-
         Args:
             entry: launcher configuration file entry.
             field_uri: id of launcher entry.
@@ -169,7 +174,7 @@ def parameters(cls):
             'device': StringField(regex=SUPPORTED_DEVICE_REGEX, description="Device name."),
             'caffe_model': PathField(optional=True, description="Path to Caffe model file."),
             'caffe_weights': PathField(optional=True, description="Path to Caffe weights file."),
-            'mxnet_weights': PathField(optional=True, description="Path to MxNet weights file."),
+            'mxnet_weights': PathField(optional=True, description="Path to MXNet weights file."),
             'tf_model': PathField(optional=True, description="Path to TF model file."),
             'tf_meta': PathField(optional=True, description="Path to TF meta file."),
             'onnx_model': PathField(optional=True, description="Path to ONNX model file."),
@@ -197,15 +202,18 @@ def parameters(cls):
                 optional=True, is_directory=True, description="TF Object Detection API Config."
             ),
             '_tf_custom_op_config_dir': PathField(
-                optional=True, is_directory=True, description="TF Custom Operation Config."
+                optional=True, is_directory=True, description="TF Custom Operation Config prefix."
             ),
+            '_transformations_config_dir': PathField(
+                optional=True, is_directory=True, description="Transformation config prefix for Model Optimizer"),
             '_tf_obj_detection_api_pipeline_config_path': PathField(
                 optional=True, is_directory=False, description="TF Custom Operation Pipeline Config."),
             '_cpu_extensions_mode': StringField(optional=True, description="CPU extensions mode."),
             '_aocl': PathField(optional=True, description="path to aocl (FPGA only)"),
             '_vpu_log_level': StringField(
                 optional=True, choices=VPU_LOG_LEVELS, description="VPU LOG level: {}".format(', '.join(VPU_LOG_LEVELS))
-            )
+            ),
+            '_prev_bitstream': PathField(optional=True, description="path to bitstream from previous run (FPGA only)")
         })
 
         return parameters
@@ -219,6 +227,7 @@ def __init__(self, config_entry, delayed_model_loading=False):
         dlsdk_launcher_config.validate(self.config)
 
         self._device = self.config['device'].upper()
+        self._device_ids = self._check_device_id()
         self._set_variable = False
         self._prepare_bitstream_firmware(self.config)
         self._delayed_model_loading = delayed_model_loading
@@ -230,7 +239,7 @@ def __init__(self, config_entry, delayed_model_loading=False):
                 self._model = self.get_value_from_config('model')
                 self._weights = self.get_value_from_config('weights')
 
-            self.load_network()
+            self.load_network(log=True)
 
         self.allow_reshape_input = self.get_value_from_config('allow_reshape_input')
         self._do_reshape = False
@@ -269,32 +278,18 @@ def predict(self, inputs, metadata=None, **kwargs):
                 input_shapes = {layer_name: data.shape for layer_name, data in infer_inputs.items()}
                 self._reshape_input(input_shapes)
 
-            benchmark = kwargs.get('benchmark')
-
-            if benchmark:
-                benchmark(infer_inputs)
-
             result = self.exec_network.infer(infer_inputs)
-
-            raw_outputs_callback = kwargs.get('output_callback')
-
-            if raw_outputs_callback:
-                raw_outputs_callback(result, network=self.network, exec_network=self.exec_network)
             results.append(result)
 
         if metadata is not None:
-            for image_meta in metadata:
-                image_meta['input_shape'] = self.inputs_info_for_meta()
-
+            for meta_ in metadata:
+                meta_['input_shape'] = self.inputs_info_for_meta()
         self._do_reshape = False
 
         return results
 
     def predict_async(self, ir, inputs, metadata=None, **kwargs):
         infer_inputs = inputs[0]
-        benchmark = kwargs.get('benchmark')
-        if benchmark:
-            benchmark(infer_inputs)
         ir.async_infer(inputs=infer_inputs)
         if metadata is not None:
             for meta_ in metadata:
@@ -316,6 +311,18 @@ def _devices_list(self):
 
         return [platform_.upper().strip() for platform_ in device.split(',')]
 
+    def _check_device_id(self):
+        device_list = self._devices_list()
+        myriad_devices = [device_name for device_name in device_list if device_name.startswith('MYRIAD')]
+        device_ids = []
+        for myriad_device in myriad_devices:
+            device_with_id = myriad_device.split('.')
+            device_ids.append('.'.join(device_with_id[1:]).lower() if len(device_with_id) > 1 else None)
+        for devise_id in device_ids:
+            if devise_id is not None:
+                self._device = self._device.replace('.' + devise_id.upper(), '')
+        return device_ids
+
     def _set_affinity(self, affinity_map_path):
         self.plugin.set_initial_affinity(self.network)
         layers = self.network.layers
@@ -347,20 +354,25 @@ def _prepare_bitstream_firmware(self, config):
 
         bitstream = config.get('bitstream')
         if bitstream:
-            print_info('programming bitstream: {}'.format(bitstream.name))
-            aocl_executable = config.get('_aocl')
-            if aocl_executable:
-                subprocess.run([str(aocl_executable), 'program', 'acl0', str(bitstream)], check=True)
+            previous_bitstream = config.get('_prev_bitstream', '')
+            if str(previous_bitstream) != str(bitstream):
+                print_info('programming bitstream: {}'.format(bitstream.name))
+                aocl_executable = config.get('_aocl')
+                if aocl_executable:
+                    subprocess.run([str(aocl_executable), 'program', 'acl0', str(bitstream)], check=True)
+                    os.environ[FPGA_COMPILER_MODE_VAR] = '3'
+                    self._set_variable = True
+                else:
+                    aocx_variable = 'DLA_AOCX'
+                    previous_bitstream = os.environ.get(aocx_variable)
+                    if previous_bitstream == str(bitstream):
+                        return
+                    os.environ[aocx_variable] = str(bitstream)
+                    if not os.environ.get(aocx_variable):
+                        warning('Warning: {} has not been set'.format(aocx_variable))
+            else:
                 os.environ[FPGA_COMPILER_MODE_VAR] = '3'
                 self._set_variable = True
-            else:
-                aocx_variable = 'DLA_AOCX'
-                previous_bitstream = os.environ.get(aocx_variable)
-                if previous_bitstream == str(bitstream):
-                    return
-                os.environ[aocx_variable] = str(bitstream)
-                if not os.environ.get(aocx_variable):
-                    warning('Warning: {} has not been set'.format(aocx_variable))
 
     @staticmethod
     def get_cpu_extension(cpu_extensions, selection_mode):
@@ -372,6 +384,10 @@ def get_cpu_extensions_list(file_format, base_name, selection_mode):
                 if extension_list:
                     return extension_list
 
+                if get_cpu_info is None:
+                    raise ValueError('CPU extensions automatic search requires pycpuinfo. '
+                                     'Please install it or set cpu extensions lib directly')
+
                 cpu_info_flags = get_cpu_info()['flags']
                 supported_flags = ['avx512', 'avx2', 'sse4_1', 'sse4_2']
                 cpu_info_flag_to_suffix = {
@@ -451,8 +467,12 @@ def convert_model(config, framework=None):
             get_parameter_value_from_config(config, DLSDKLauncher.parameters(), 'mo_params'),
             get_parameter_value_from_config(config, DLSDKLauncher.parameters(), 'mo_flags'),
             get_parameter_value_from_config(config, DLSDKLauncher.parameters(), '_tf_custom_op_config_dir'),
-            get_parameter_value_from_config(config, DLSDKLauncher.parameters(),
-                                            '_tf_obj_detection_api_pipeline_config_path'),
+            get_parameter_value_from_config(
+                config, DLSDKLauncher.parameters(), '_tf_obj_detection_api_pipeline_config_path'
+            ),
+            get_parameter_value_from_config(
+                config, DLSDKLauncher.parameters(), '_transformations_config_dir'
+            ),
             should_log_cmd=should_log_mo_cmd
         )
 
@@ -483,7 +503,6 @@ def _reshape_input(self, shapes):
             self.network.reshape(shapes)
 
         self.exec_network = self.plugin.load(network=self.network, num_requests=self._num_requests)
-        self._do_reshape = False
 
     def _set_batch_size(self, batch_size):
         # in some cases we can not use explicit property for setting batch size, so we need to use reshape instead
@@ -517,12 +536,24 @@ def _align_data_shape(self, data, input_blob):
             filled_part = [data[-1]] * diff_number
             data = np.concatenate([data, filled_part])
 
-        if len(data.shape) > 1 and len(input_shape) > 1 and data.shape[1] != input_shape[1]:
-            data = data[:, :input_shape[1]]
-
         return data.reshape(input_shape)
 
     def create_ie_plugin(self, log=True):
+        def set_nireq():
+            # Fill self._num_requests from the 'num_requests' config entry and self.async_mode.
+            num_requests = self.config.get('num_requests')
+            if num_requests is not None:
+                num_requests = get_or_parse_value(num_requests, casting_type=int)
+                if len(num_requests) != 1:
+                    raise ConfigError('Several values for _num_requests specified')
+                self._num_requests = num_requests[0]
+                if self._num_requests != 1 and not self.async_mode:
+                    warning('{} infer requests in sync mode is not supported. '
+                            'Only 1 infer request will be used.'.format(self._num_requests))
+                    self._num_requests = 1
+            else:
+                self._num_requests = self.auto_num_requests() if self.async_mode else 1
+
         if hasattr(self, 'plugin'):
             del self.plugin
         if log:
@@ -532,16 +563,14 @@ def create_ie_plugin(self, log=True):
         else:
             self.plugin = ie.IEPlugin(self._device)
             self.async_mode = self.get_value_from_config('async_mode')
-            num_requests = get_or_parse_value(self.config.get('num_requests', 1), casting_type=int)
-            if len(num_requests) != 1:
-                raise ConfigError('Several values for _num_requests specified')
-            self._num_requests = num_requests[0]
-            if self._num_requests != 1 and not self.async_mode:
-                warning('{} infer requests in sync mode is not supported. Only 1 infer request will be used.')
-                self._num_requests = 1
+            set_nireq()
+
             if log:
                 print_info('Loaded {} plugin version: {}'.format(self.plugin.device, self.plugin.version))
-
+        if self._device_ids:
+            correct_id = [device_id for device_id in self._device_ids if device_id is not None]
+            if correct_id:
+                self.plugin.set_config({'DEVICE_ID': correct_id[0]})
         cpu_extensions = self.config.get('cpu_extensions')
         if cpu_extensions and 'CPU' in self._devices_list():
             selection_mode = self.config.get('_cpu_extensions_mode')
@@ -553,7 +582,29 @@ def create_ie_plugin(self, log=True):
         if self._is_vpu():
             log_level = self.config.get('_vpu_log_level')
             if log_level:
-                self.plugin.set_config({'VPU_LOG_LEVEL': log_level})
+                self.plugin.set_config({'LOG_LEVEL': log_level})
+
+    def auto_num_requests(self):
+        """
+        Choose the number of infer requests from the configured device list.
+        """
+        concurrency_device = {
+            'CPU': 1,
+            'GPU': 1,
+            'HDDL': 100,
+            'MYRIAD': 4,
+            'FPGA': 3
+        }
+        platform_list = self._devices_list()
+        if 'CPU' in platform_list and len(platform_list) == 1:
+            cpu_count = multiprocessing.cpu_count()
+            for min_request in (4, 5, 3):
+                if cpu_count % min_request == 0:
+                    # floor division keeps the result an int; '/' would produce a float count
+                    return max(min_request, cpu_count // min_request)
+        if 'GPU' in platform_list and len(platform_list) == 1:
+            return 2
+        return sum(concurrency_device.get(device, 1) for device in platform_list)
 
     def _create_multi_device_plugin(self, log=True):
         async_mode = self.get_value_from_config('async_mode')
@@ -618,7 +669,7 @@ def output_preprocessing(output_string):
         elif affinity_map_path:
             warning('affinity_map config is applicable only for HETERO device')
 
-    def load_network(self, network=None):
+    def load_network(self, network=None, log=False):
         if hasattr(self, 'exec_network'):
             del self.exec_network
         if not hasattr(self, 'plugin'):
@@ -627,12 +678,15 @@ def load_network(self, network=None):
             self._create_network()
         else:
             self.network = network
+        self._set_precision()
+        if log:
+            self._print_input_output_info()
         self.exec_network = self.plugin.load(network=self.network, num_requests=self.num_requests)
 
-    def load_ir(self, xml_path, bin_path):
+    def load_ir(self, xml_path, bin_path, log=False):
         self._model = xml_path
         self._weights = bin_path
-        self.load_network()
+        self.load_network(log=log)
 
     @staticmethod
     def create_ie_network(model_xml, model_bin):
@@ -644,7 +698,7 @@ def inputs_info_for_meta(self):
             if layer_name not in self.const_inputs + self.image_info_inputs
         }
 
-    def fit_to_input(self, data, layer_name, layout):
+    def fit_to_input(self, data, layer_name, layout, precision):
         def data_to_blob(layer_shape, data):
             data_shape = np.shape(data)
             if len(layer_shape) == 4:
@@ -654,12 +708,16 @@ def data_to_blob(layer_shape, data):
 
             if len(layer_shape) == 2 and len(data_shape) == 1:
                 return np.transpose([data])
+            if len(layer_shape) == 5 and len(layout) == 5:
+                return np.transpose(data, layout)
 
             return np.array(data)
 
         layer_shape = tuple(self.inputs[layer_name].shape)
 
         data = data_to_blob(layer_shape, data)
+        if precision:
+            data = data.astype(precision)
 
         data_shape = np.shape(data)
         if data_shape != layer_shape:
@@ -669,6 +727,24 @@ def data_to_blob(layer_shape, data):
 
         return self._align_data_shape(data, layer_name)
 
+    def _set_precision(self):
+        # copy each configured input 'precision' onto the matching network input
+        for layer_config in self.config.get('inputs', []):
+            if 'precision' in layer_config:
+                self.network.inputs[layer_config['name']].precision = layer_config['precision']
+
+    def _print_input_output_info(self):
+        """
+        Print name, precision and shape of each network input, then of each output.
+        """
+        for header, blobs_attr in (('Input info:', 'inputs'), ('Output info', 'outputs')):
+            print_info(header)
+            # the attribute is resolved per section, so outputs are read only after inputs are printed
+            for layer_name, layer in getattr(self.network, blobs_attr).items():
+                print_info('\tLayer name: {}'.format(layer_name))
+                print_info('\tprecision: {}'.format(layer.precision))
+                print_info('\tshape {}\n'.format(layer.shape))
+
     def release(self):
         if 'network' in self.__dict__:
             del self.network
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/dlsdk_launcher_readme.md b/tools/accuracy_checker/accuracy_checker/launcher/dlsdk_launcher_readme.md
index 6f43af8063d..4398c453b41 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/dlsdk_launcher_readme.md
+++ b/tools/accuracy_checker/accuracy_checker/launcher/dlsdk_launcher_readme.md
@@ -2,7 +2,10 @@
 
 For enabling OpenVINO™ launcher you need to add `framework: dlsdk` in launchers section of your configuration file and provide following parameters:
 
-* `device` - specifies which device will be used for infer. Supported: `CPU`, `GPU`, `FPGA`, `MYRIAD`, Heterogeneous plugin as `HETERO:target_device,fallback_device` and Multi device plugin as `MULTI:target_device1,target_device2`. You are able to not specify device intently and provide one or several devices via `-td, --target devices` command line argument. Target device will be selected from command line (in turn when several devices provided, evaluations will be run one by one with all specified devices).
+* `device` - specifies which device will be used for inference. Supported: `CPU`, `GPU`, `FPGA`, `MYRIAD`, `HDDL`,
+Heterogeneous plugin as `HETERO:target_device,fallback_device` and Multi device plugin as `MULTI:target_device1,target_device2`.
+If you have several MYRIAD devices in your machine, you can select a specific one by its device id: `MYRIAD.<DEVICE_ID>` (e.g. `MYRIAD.1.2-ma2480`).
+It is possible to specify one or more devices via `-td, --target devices` command line argument. Target device will be selected from command line (when several devices are provided, evaluations will be run one by one with all specified devices).
 * `model` - path to xml file with Caffe model for your topology.
 * `weights` - path to bin file with weights for your topology.
 
@@ -47,7 +50,8 @@ Each input description should has following info:
     * `CONST_INPUT` - input will be filled using constant provided in config. It also requires to provide `value`.
     * `IMAGE_INFO` - specific key for setting information about input shape to layer (used in Faster RCNN based topologies). You do not need provide `value`, because it will be calculated in runtime. Format value is `Nx[H, W, S]`, where `N` is batch size, `H` - original image height, `W` - original image width, `S` - scale of original image (default 1).
     * `INPUT` - network input for main data stream (e. g. images). If you have several data inputs, you should provide regular expression for identifier as `value` for specifying which one data should be provided in specific input.
-    Optionally you can determine `shape` of input (actually does not used, DLSDK launcher uses info given from network) and `layout` in case when your model was trained with non-standard data layout (For DLSDK default layout is `NCHW`).
+    Optionally you can specify `shape` of input (it is not actually used, DLSDK launcher uses info given from network), `layout` in case when your model was trained with non-standard data layout (For DLSDK default layout is `NCHW`)
+    and `precision` (Supported precisions: `FP32` - float, `FP16` - signed short, `U8` - unsigned char, `U16` - unsigned short int, `I8` - signed char, `I16` - short int, `I32` - int, `I64` - long int).
 
 OpenVINO™ launcher config example:
 
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/dummy_launcher.py b/tools/accuracy_checker/accuracy_checker/launcher/dummy_launcher.py
index 0076739b258..54cad87e0f0 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/dummy_launcher.py
+++ b/tools/accuracy_checker/accuracy_checker/launcher/dummy_launcher.py
@@ -21,6 +21,7 @@
 from .loaders import Loader
 from .launcher import Launcher, LauncherConfigValidator
 
+
 class DummyLauncher(Launcher):
     """
     Class for using predictions from another tool.
@@ -46,7 +47,7 @@ def __init__(self, config_entry: dict, *args, **kwargs):
 
         self.data_path = get_path(self.get_value_from_config('data_path'))
 
-        self._loader = Loader.provide(self.get_value_from_config['loader'], self.data_path)
+        self._loader = Loader.provide(self.get_value_from_config('loader'), self.data_path)
 
         print_info("{} predictions objects loaded from {}".format(len(self._loader), self.data_path))
 
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/input_feeder.py b/tools/accuracy_checker/accuracy_checker/launcher/input_feeder.py
index 2cdabcd2164..76196211665 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/input_feeder.py
+++ b/tools/accuracy_checker/accuracy_checker/launcher/input_feeder.py
@@ -19,21 +19,38 @@
 
 from ..config import ConfigError
 from ..utils import extract_image_representations
+from ..data_readers import MultiFramesInputIdentifier
 
 LAYER_LAYOUT_TO_IMAGE_LAYOUT = {
     'NCHW': [0, 3, 1, 2],
     'NHWC': [0, 1, 2, 3],
     'NCWH': [0, 3, 2, 1],
-    'NWHC': [0, 2, 1, 3]
+    'NWHC': [0, 2, 1, 3],
+    'NCDHW': [0, 4, 1, 2, 3],
+    'NDCHW': [0, 1, 4, 2, 3],
+    'NDHWC': [0, 1, 2, 3, 4]
+}
+
+PRECISION_TO_DTYPE = {
+    'FP32': np.float32,  # float
+    'FP16': np.float16,  # signed short
+    'U8': np.uint8,  # unsigned char
+    'U16': np.uint16,  # unsigned short
+    'I8': np.int8,  # signed char
+    'I16': np.int16,  # signed short
+    'I32': np.int32,  # signed int
+    'I64': np.int64,  # signed long int
 }
 
 
 class InputFeeder:
     def __init__(self, inputs_config, network_inputs, prepare_input_data=None, default_layout='NCHW'):
-        def fit_to_input(data, input_layer_name, layout):
+        def fit_to_input(data, input_layer_name, layout, precision):
             if len(np.shape(data)) == 4:
-                return np.transpose(data, layout)
-            return np.array(data)
+                data = np.transpose(data, layout)
+            else:
+                data = np.array(data)
+            return data.astype(precision) if precision else data
 
         self.input_transform_func = prepare_input_data or fit_to_input
         self.network_inputs = network_inputs
@@ -49,7 +66,7 @@ def __call__(self, context, *args, **kwargs):
     def configure(self, inputs_config):
         parsing_results = self._parse_inputs_config(inputs_config, self.default_layout)
         self.const_inputs, self.non_constant_inputs = parsing_results[:2]
-        self.inputs_mapping, self.image_info_inputs, self.layouts_mapping = parsing_results[2:]
+        self.inputs_mapping, self.image_info_inputs, self.layouts_mapping, self.precision_mapping = parsing_results[2:]
         if not self.non_constant_inputs:
             raise ConfigError('Network should contain at least one layer for setting variable data.')
 
@@ -77,8 +94,10 @@ def prepare_image_info(image_sizes_batch):
         return image_infos
 
     def fill_non_constant_inputs(self, data_representation_batch):
-        image_info_inputs = self._fill_image_info_inputs(data_representation_batch)
-        filled_inputs = {**image_info_inputs}
+        filled_inputs = {}
+        if self.image_info_inputs:
+            image_info_inputs = self._fill_image_info_inputs(data_representation_batch)
+            filled_inputs = {**image_info_inputs}
         for input_layer in self.non_constant_inputs:
             input_regex = None
             input_batch = []
@@ -88,20 +107,26 @@ def fill_non_constant_inputs(self, data_representation_batch):
                 input_data = None
                 identifiers = data_representation.identifier
                 data = data_representation.data
-                if not isinstance(identifiers, list) and not input_regex:
+                if not isinstance(identifiers, list) and input_regex is None:
                     input_data = data
                     input_batch.append(input_data)
                     continue
 
-                if not input_regex:
+                if input_regex is None:
                     raise ConfigError('Impossible to choose correct data for layer {}.'
                                       'Please provide regular expression for matching in config.'.format(input_layer))
-                data = [data] if np.isscalar(identifiers) else data
-                identifiers = [identifiers] if np.isscalar(identifiers) else identifiers
-                for identifier, data_value in zip(identifiers, data):
-                    if input_regex.match(identifier):
-                        input_data = data_value
-                        break
+                if isinstance(identifiers, MultiFramesInputIdentifier):
+                    input_id_order = {
+                        input_index: frame_id for frame_id, input_index in enumerate(identifiers.input_id)
+                    }
+                    input_data = data[input_id_order[input_regex]]
+                else:
+                    data = [data] if np.isscalar(identifiers) else data
+                    identifiers = [identifiers] if np.isscalar(identifiers) else identifiers
+                    for identifier, data_value in zip(identifiers, data):
+                        if input_regex.match(identifier):
+                            input_data = data_value
+                            break
                 if input_data is None:
                     raise ConfigError('Suitable data for filling layer {} not found'.format(input_layer))
                 input_batch.append(input_data)
@@ -117,32 +142,47 @@ def fill_inputs(self, data_representation_batch):
         return inputs
 
     def _parse_inputs_config(self, inputs_entry, default_layout='NCHW'):
+        def get_layer_precision(input_config, input_name):
+            if 'precision' not in input_config:
+                return None
+            input_precision = PRECISION_TO_DTYPE.get(input_config['precision'])
+            if input_precision is None:
+                raise ConfigError("unsupported precision {} for layer {}".format(input_config['precision'], input_name))
+            precisions[input_name] = input_precision
+            return input_precision
+
         constant_inputs = {}
         non_constant_inputs_mapping = {}
         config_non_constant_inputs = []
         layouts = {}
+        precisions = {}
         image_info_inputs = []
+
         for input_ in inputs_entry:
             name = input_['name']
-            if not name in self.network_inputs:
+            if name not in self.network_inputs:
                 raise ConfigError('network does not contain input "{}"'.format(name))
 
             if input_['type'] == 'IMAGE_INFO':
                 image_info_inputs.append(name)
+                get_layer_precision(input_, name)
                 continue
             value = input_.get('value')
 
             if input_['type'] == 'CONST_INPUT':
                 if isinstance(value, list):
                     value = np.array(value)
+                    precision = get_layer_precision(input_, name)
+                    value = value.astype(precision) if precision is not None else value
                 constant_inputs[name] = value
             else:
                 config_non_constant_inputs.append(name)
-                if value:
-                    value = re.compile(value)
+                if value is not None:
+                    value = re.compile(value) if not isinstance(value, int) else value
                     non_constant_inputs_mapping[name] = value
                 layout = input_.get('layout', default_layout)
                 layouts[name] = LAYER_LAYOUT_TO_IMAGE_LAYOUT[layout]
+                get_layer_precision(input_, name)
 
         all_config_inputs = config_non_constant_inputs + list(constant_inputs.keys()) + image_info_inputs
         not_config_inputs = [input_layer for input_layer in self.network_inputs if input_layer not in all_config_inputs]
@@ -150,7 +190,14 @@ def _parse_inputs_config(self, inputs_entry, default_layout='NCHW'):
             raise ConfigError('input value for {} are not presented in config.'.format(','.join(not_config_inputs)))
         non_constant_inputs = not_config_inputs + config_non_constant_inputs
 
-        return constant_inputs, non_constant_inputs, non_constant_inputs_mapping or None, image_info_inputs, layouts
+        return (
+            constant_inputs,
+            non_constant_inputs,
+            non_constant_inputs_mapping or None,
+            image_info_inputs,
+            layouts,
+            precisions
+        )
 
     def _transform_batch(self, batch_data, meta):
         def calculate_num_splits(layers_data, batch_size):
@@ -183,14 +230,16 @@ def separate_data(data, num_splits):
                 for infer_id, on_infer_batch in enumerate(batch_for_all_infers):
                     infers_data[infer_id][layer_name] = self.input_transform_func(
                         on_infer_batch, layer_name,
-                        self.layouts_mapping.get(layer_name, LAYER_LAYOUT_TO_IMAGE_LAYOUT[self.default_layout])
+                        self.layouts_mapping.get(layer_name, LAYER_LAYOUT_TO_IMAGE_LAYOUT[self.default_layout]),
+                        self.precision_mapping.get(layer_name)
                     )
             return infers_data
 
         for layer_name, layer_data in batch_data.items():
             batch_data[layer_name] = self.input_transform_func(
                 layer_data, layer_name,
-                self.layouts_mapping.get(layer_name, LAYER_LAYOUT_TO_IMAGE_LAYOUT[self.default_layout])
+                self.layouts_mapping.get(layer_name, LAYER_LAYOUT_TO_IMAGE_LAYOUT[self.default_layout]),
+                self.precision_mapping.get(layer_name)
             )
 
         return [batch_data]
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/launcher.py b/tools/accuracy_checker/accuracy_checker/launcher/launcher.py
index 414440a2ab1..cfb36b0af1a 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/launcher.py
+++ b/tools/accuracy_checker/accuracy_checker/launcher/launcher.py
@@ -137,10 +137,12 @@ def _provide_inputs_info_to_meta(self, meta):
         return meta
 
     @staticmethod
-    def fit_to_input(data, layer_name, layout):
+    def fit_to_input(data, layer_name, layout, precision):
         if len(np.shape(data)) == 4:
-            return np.transpose(data, layout)
-        return np.array(data)
+            data = np.transpose(data, layout)
+        else:
+            data = np.array(data)
+        return data.astype(precision) if precision else data
 
     def inputs_info_for_meta(self):
         return {
@@ -152,6 +154,7 @@ def inputs_info_for_meta(self):
     def name(self):
         return self.__provider__
 
+
 def unsupported_launcher(name, error_message=None):
     class UnsupportedLauncher(Launcher):
         __provider__ = name
@@ -179,6 +182,7 @@ def create_launcher(launcher_config, delayed_model_loading=False):
     """
     Args:
         launcher_config: launcher configuration file entry.
+        delayed_model_loading: allows postpone model loading to the launcher
     Returns:
         framework-specific launcher object.
     """
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/model_conversion.py b/tools/accuracy_checker/accuracy_checker/launcher/model_conversion.py
index 03876b4660f..fc1f30b24d5 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/model_conversion.py
+++ b/tools/accuracy_checker/accuracy_checker/launcher/model_conversion.py
@@ -27,7 +27,9 @@
 
 def convert_model(topology_name, model=None, weights=None, meta=None,
                   framework=FrameworkParameters('caffe', False), mo_search_paths=None, mo_params=None, mo_flags=None,
-                  tf_custom_op_config_dir=None, tf_object_detection_api_config_dir=None, should_log_cmd=False):
+                  tf_custom_op_config_dir=None, tf_object_detection_api_config_dir=None,
+                  transformations_config_dir=None,
+                  should_log_cmd=False):
     """
     Args:
         topology_name: name for converted model files.
@@ -38,8 +40,10 @@ def convert_model(topology_name, model=None, weights=None, meta=None,
         mo_search_paths: paths where ModelOptimizer may be found. If None only default paths is used.
         mo_params: value parameters for ModelOptimizer execution.
         mo_flags: flags parameters for ModelOptimizer execution.
-        tf_custom_op_config_dir: path to Tensor Flow custom operations directory.
+        tf_custom_op_config_dir: path to TensorFlow custom operations directory.
+        transformations_config_dir: path to Model Optimizer transformations extensions directory.
         tf_object_detection_api_config_dir: path to Tensor Flow directory with config for object detection API.
+        should_log_cmd: whether to print out the Model Optimizer command line arguments.
     Returns:
         paths to converted to IE IR model and weights.
     """
@@ -68,7 +72,10 @@ def convert_model(topology_name, model=None, weights=None, meta=None,
     mo_params['framework'] = framework.name
     mo_params.update(framework_specific_options.get(framework, {}))
 
-    set_path_to_custom_operation_configs(mo_params, framework, tf_custom_op_config_dir, model_optimizer_executable)
+    set_path_to_tf_custom_operation_configs(
+        mo_params, framework, tf_custom_op_config_dir, model_optimizer_executable
+    )
+    set_path_to_transformation_configs(mo_params, framework, transformations_config_dir, model_optimizer_executable)
     set_path_to_object_detection_api_pipeline_config(mo_params, framework, tf_object_detection_api_config_dir)
     args = prepare_args(str(model_optimizer_executable), flag_options=mo_flags, value_options=mo_params)
 
@@ -162,6 +169,7 @@ def print_cmd(args, indent=0):
     if arr_to_print:
         print_info(indent_str + " ".join(arr_to_print))
 
+
 def exec_mo_binary(args, timeout=None, should_log_cmd=False):
     """
     Args:
@@ -177,24 +185,42 @@ def exec_mo_binary(args, timeout=None, should_log_cmd=False):
     return subprocess.run(args, check=False, timeout=timeout)
 
 
-def set_path_to_custom_operation_configs(mo_params, framework, tf_custom_op_config_dir, mo_path):
+def set_path_to_tf_custom_operation_configs(
+        mo_params, framework, tf_custom_op_config_dir, mo_path
+):
     if framework.name != 'tf':
         return mo_params
 
-    config_path = mo_params.get('tensorflow_use_custom_operations_config')
-    if not config_path:
+    tf_custom_op_config_path = mo_params.get('tensorflow_use_custom_operations_config')
+    if not tf_custom_op_config_path:
         return mo_params
 
     if tf_custom_op_config_dir:
-        tf_custom_op_config_dir = Path(tf_custom_op_config_dir)
+        prefix_dir = Path(tf_custom_op_config_dir)
     else:
-        tf_custom_op_config_dir = Path('/').joinpath(*mo_path.parts[:-1]) / 'extensions' / 'front' / 'tf'
+        prefix_dir = Path('/').joinpath(*mo_path.parts[:-1]) / 'extensions' / 'front' / 'tf'
 
-    config_path = Path(config_path)
+    config_path = Path(tf_custom_op_config_path)
     if not config_path.is_absolute():
-        config_path = tf_custom_op_config_dir / config_path
+        config_path = prefix_dir / config_path
+        mo_params['tensorflow_use_custom_operations_config'] = str(get_path(config_path))
+
+    return mo_params
+
 
-    mo_params['tensorflow_use_custom_operations_config'] = str(get_path(config_path))
+def set_path_to_transformation_configs(mo_params, framework, transformation_config_dir, mo_path):
+    """
+    Replace a relative 'transformations_config' value in mo_params with its location under the configs directory.
+    """
+    config_value = mo_params.get('transformations_config')
+    if config_value:
+        base_dir = (
+            Path(transformation_config_dir) if transformation_config_dir
+            else Path('/').joinpath(*mo_path.parts[:-1]) / 'extensions' / 'front' / framework.name
+        )
+        candidate = Path(config_value)
+        if not candidate.is_absolute():
+            mo_params['transformations_config'] = str(get_path(base_dir / candidate))
 
     return mo_params
 
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/mxnet_launcher.py b/tools/accuracy_checker/accuracy_checker/launcher/mxnet_launcher.py
index e3019c38d66..114c734f097 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/mxnet_launcher.py
+++ b/tools/accuracy_checker/accuracy_checker/launcher/mxnet_launcher.py
@@ -39,7 +39,7 @@ def validate(self, entry, field_uri=None):
 
 class MxNetLauncher(Launcher):
     """
-    Class for infer model using MxNet framework
+    Class for infer model using MXNet framework
     """
     __provider__ = 'mxnet'
 
@@ -57,59 +57,63 @@ def parameters(cls):
 
     def __init__(self, config_entry: dict, *args, **kwargs):
         super().__init__(config_entry, *args, **kwargs)
+        self._delayed_model_loading = kwargs.get('delayed_model_loading', False)
 
-        mxnet_launcher_config = MxNetLauncherConfigValidator('MxNet_Launcher', fields=self.parameters())
-        mxnet_launcher_config.validate(self.config)
-
-        # Get model name, prefix, epoch
-        self.model = self.config['model']
-        model_path, model_file = self.model.parent, self.model.name
-        model_name = model_file.rsplit('.', 1)[0]
-        model_prefix, model_epoch = model_name.rsplit('-', 1)
-
-        # Get device and set device context
-        match = re.match(DEVICE_REGEX, self.config['device'].lower())
-        if match.group('device') == 'gpu':
-            identifier = match.group('identifier')
-            if identifier is None:
-                identifier = 0
-            device_context = mxnet.gpu(int(identifier))
-        else:
-            device_context = mxnet.cpu()
-
-        # Get batch from config or 1
-        self._batch = self.config.get('batch', 1)
-
-        # Get input shapes
-        input_shapes = []
-
-        for input_config in self.config['inputs']:
-            input_shape = input_config['shape']
-            input_shape = string_to_tuple(input_shape, casting_type=int)
-            input_shapes.append((input_config['name'], (self._batch, *input_shape)))
-
-        # Load checkpoints
-        sym, arg_params, aux_params = mxnet.model.load_checkpoint(
-            model_path / model_prefix, int(model_epoch)
+        mxnet_launcher_config = MxNetLauncherConfigValidator(
+            'MxNet_Launcher', fields=self.parameters(), delayed_model_loading=self._delayed_model_loading
         )
-        self._inputs = OrderedDict(input_shapes)
-        # Create a module
-        self.module = mxnet.mod.Module(symbol=sym, context=device_context, label_names=None)
-        self.module.bind(for_training=False, data_shapes=input_shapes)
-        self.module.set_params(arg_params, aux_params, allow_missing=True)
+        mxnet_launcher_config.validate(self.config)
+        if not self._delayed_model_loading:
+            # Get model name, prefix, epoch
+            self.model = self.config['model']
+            model_path, model_file = self.model.parent, self.model.name
+            model_name = model_file.rsplit('.', 1)[0]
+            model_prefix, model_epoch = model_name.rsplit('-', 1)
+
+            # Get device and set device context
+            match = re.match(DEVICE_REGEX, self.config['device'].lower())
+            if match.group('device') == 'gpu':
+                identifier = match.group('identifier')
+                if identifier is None:
+                    identifier = 0
+                device_context = mxnet.gpu(int(identifier))
+            else:
+                device_context = mxnet.cpu()
+
+            # Get batch from config or 1
+            self._batch = self.config.get('batch', 1)
+
+            # Get input shapes
+            input_shapes = []
+
+            for input_config in self.config['inputs']:
+                input_shape = input_config['shape']
+                input_shape = string_to_tuple(input_shape, casting_type=int)
+                input_shapes.append((input_config['name'], (self._batch, *input_shape)))
+
+            # Load checkpoints
+            sym, arg_params, aux_params = mxnet.model.load_checkpoint(
+                model_path / model_prefix, int(model_epoch)
+            )
+            self._inputs = OrderedDict(input_shapes)
+            # Create a module
+            self.module = mxnet.mod.Module(symbol=sym, context=device_context, label_names=None)
+            self.module.bind(for_training=False, data_shapes=input_shapes)
+            self.module.set_params(arg_params, aux_params, allow_missing=True)
 
     @property
     def batch(self):
         return self._batch
 
-    def fit_to_input(self, data, input_layer, layout):
-        return mxnet.nd.array(np.transpose(data, layout))
+    def fit_to_input(self, data, input_layer, layout, precision):
+        data = np.transpose(data, layout)
+        return mxnet.nd.array(data.astype(precision) if precision else data)
 
     @property
     def inputs(self):
         return self._inputs
 
-    def predict(self, inputs, metadata, *args, **kwargs):
+    def predict(self, inputs, metadata=None, **kwargs):
         """
         Args:
             inputs: dictionary where keys are input layers names and values are data for them.
@@ -130,13 +134,14 @@ def predict(self, inputs, metadata, *args, **kwargs):
                 infer_res[layer.replace('_output', '')] = out.asnumpy()
             results.append(infer_res)
 
-        for meta_ in metadata:
-            meta_['input_shape'] = self.inputs_info_for_meta()
+        if metadata is not None:
+            for meta_ in metadata:
+                meta_['input_shape'] = self.inputs_info_for_meta()
 
         return results
 
     def predict_async(self, *args, **kwargs):
-        raise ValueError('MxNet Launcher does not support async mode yet')
+        raise ValueError('MXNet Launcher does not support async mode yet')
 
     @property
     def output_blob(self):
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/mxnet_launcher_readme.md b/tools/accuracy_checker/accuracy_checker/launcher/mxnet_launcher_readme.md
index ea08b345965..50ce0919863 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/mxnet_launcher_readme.md
+++ b/tools/accuracy_checker/accuracy_checker/launcher/mxnet_launcher_readme.md
@@ -1,6 +1,6 @@
-# How to configure MxNet launcher
+# How to configure MXNet launcher
 
-For enabling MxNet launcher you need to add `framework: mxnet` in launchers section of your configuration file and provide following parameters:
+For enabling MXNet launcher you need to add `framework: mxnet` in launchers section of your configuration file and provide following parameters:
 
 * `device` - specifies which device will be used for infer (`cpu`, `gpu_0` and so on).
 * `model`- path to params file specifying the numeric arrays used in the network.
@@ -14,10 +14,11 @@ Each input description should has following info:
     * `IMAGE_INFO` - specific key for setting information about input shape to layer (used in Faster RCNN based topologies). You do not need provide `value`, because it will be calculated in runtime. Format value is `Nx[H, W, S]`, where `N` is batch size, `H` - original image height, `W` - original image width, `S` - scale of original image (default 1).
     * `INPUT` - network input for main data stream (e. g. images). If you have several data inputs, you should provide regular expression for identifier as `value` for specifying which one data should be provided in specific input.
   * `shape` - shape of input layer described as comma-separated of all dimensions size except batch size. 
-    Optionally you can determine `layout` in case when your model was trained with non-standard data layout (For MxNet default layout is `NCHW`).
+    Optionally you can determine `layout` in case when your model was trained with non-standard data layout (For MXNet default layout is `NCHW`)
+    and `precision` (Supported precisions: `FP32` - float, `FP16` - signed short, `U8` - unsigned char, `U16` - unsigned short int, `I8` - signed char, `I16` - short int, `I32` - int, `I64` - long int).
 You also can specify batch size for your model using `batch`.
 
-MxNet launcher config example:
+MXNet launcher config example:
 
 ```yml
 launchers:
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/onnx_launcher.py b/tools/accuracy_checker/accuracy_checker/launcher/onnx_launcher.py
index 5128bf04b8e..a36e2265b3c 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/onnx_launcher.py
+++ b/tools/accuracy_checker/accuracy_checker/launcher/onnx_launcher.py
@@ -17,8 +17,12 @@
 import re
 import numpy as np
 import onnxruntime.backend as backend
-from ..config import PathField, StringField
+import onnxruntime as onnx_rt
+from ..logging import warning
+from ..config import PathField, StringField, ListField
 from .launcher import Launcher, LauncherConfigValidator
+from ..utils import contains_all
+
 
 DEVICE_REGEX = r'(?P<device>cpu$|gpu)'
 
@@ -28,17 +32,17 @@ class ONNXLauncher(Launcher):
 
     def __init__(self, config_entry: dict, *args, **kwargs):
         super().__init__(config_entry, *args, **kwargs)
+        self._delayed_model_loading = kwargs.get('delayed_model_loading', False)
 
-        onnx_launcher_config = LauncherConfigValidator('ONNX_Launcher', fields=self.parameters())
+        onnx_launcher_config = LauncherConfigValidator(
+            'ONNX_Launcher', fields=self.parameters(), delayed_model_loading=self._delayed_model_loading,
+        )
         onnx_launcher_config.validate(self.config)
-
-        self.model = str(self.get_value_from_config('model'))
-
-        device = re.match(DEVICE_REGEX, self.get_value_from_config('device').lower()).group('device')
-        beckend_rep = backend.prepare(model=self.model, device=device.upper())
-        self._inference_session = beckend_rep._session # pylint: disable=W0212
-        outputs = self._inference_session.get_outputs()
-        self.output_names = [output.name for output in outputs]
+        if not self._delayed_model_loading:
+            self.model = self.get_value_from_config('model')
+            self._inference_session = self.create_inference_session(self.model)
+            outputs = self._inference_session.get_outputs()
+            self.output_names = [output.name for output in outputs]
 
     @classmethod
     def parameters(cls):
@@ -46,6 +50,10 @@ def parameters(cls):
         parameters.update({
             'model': PathField(description="Path to model."),
             'device': StringField(regex=DEVICE_REGEX, description="Device name.", optional=True, default='CPU'),
+            'execution_providers': ListField(
+                value_type=StringField(description="Execution provider name.", ),
+                default=['CPUExecutionProvider'], optional=True
+            )
         })
 
         return parameters
@@ -63,23 +71,53 @@ def output_blob(self):
     def batch(self):
         return 1
 
-    def predict(self, inputs, metadata, *args, **kwargs):
+    def create_inference_session(self, model):
+        if 'execution_providers' in self.config:
+            try:
+                session = self._create_session_via_execution_providers_api(model)
+                return session
+            except AttributeError:
+                warning('Execution Providers API is not supported, onnxruntime switched on Backend API')
+        return self._create_session_via_backend_api(model)
+
+    def _create_session_via_execution_providers_api(self, model):
+        session_options = onnx_rt.SessionOptions()
+        session = onnx_rt.InferenceSession(model, sess_options=session_options)
+        self.execution_providers = self.get_value_from_config('execution_providers')
+        available_providers = session.get_providers()
+        contains_all(available_providers, self.execution_providers)
+        session.set_providers(self.execution_providers)
+
+        return session
+
+    def _create_session_via_backend_api(self, model):
+        self.device = re.match(DEVICE_REGEX, self.get_value_from_config('device').lower()).group('device')
+        beckend_rep = backend.prepare(model=str(model), device=self.device.upper())
+        return beckend_rep._session  # pylint: disable=W0212
+
+    def predict(self, inputs, metadata=None, **kwargs):
         results = []
         for infer_input in inputs:
             prediction_list = self._inference_session.run(self.output_names, infer_input)
-            results.append(
-                {output_name: prediction for output_name, prediction in zip(self.output_names, prediction_list)}
-            )
-            for meta_ in metadata:
-                meta_['input_shape'] = self.inputs_info_for_meta()
+            results.append(dict(zip(self.output_names, prediction_list)))
+            if metadata is not None:
+                for meta_ in metadata:
+                    meta_['input_shape'] = self.inputs_info_for_meta()
 
         return results
 
-    @staticmethod
-    def fit_to_input(data, layer_name, layout):
+    def fit_to_input(self, data, layer_name, layout, precision):
+        layer_shape = self.inputs[layer_name]
         if len(np.shape(data)) == 4:
-            return np.transpose(data, layout).astype(np.float32)
-        return np.array(data).astype(np.float32)
+            data = np.transpose(data, layout).astype(np.float32 if not precision else precision)
+            if len(layer_shape) == 3:
+                if np.shape(data)[0] != 1:
+                    raise ValueError('Only for batch size 1 first dimension can be omitted')
+                return data[0]
+            return data
+        if len(np.shape(data)) == 5 and len(layout) == 5:
+            return np.transpose(data, layout).astype(np.float32 if not precision else precision)
+        return np.array(data).astype(np.float32 if not precision else precision)
 
     def predict_async(self, *args, **kwargs):
         raise ValueError('ONNX Runtime Launcher does not support async mode yet')
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/onnx_runtime_launcher_readme.md b/tools/accuracy_checker/accuracy_checker/launcher/onnx_runtime_launcher_readme.md
index 99e91c94e4a..27279cc75e4 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/onnx_runtime_launcher_readme.md
+++ b/tools/accuracy_checker/accuracy_checker/launcher/onnx_runtime_launcher_readme.md
@@ -2,9 +2,13 @@
 
 For enabling ONNX Runtime launcher you need to add `framework: onnx_runtime` in launchers section of your configuration file and provide following parameters:
 
-* `device` - specifies which device will be used for infer (`cpu`, `gpu` and so on).
+* `device` - specifies which device will be used for inference (`cpu`, `gpu` and so on). Optional; `cpu` is used by default, or the device can depend on the execution provider in use.
 * `model`- path to the network file in ONNX format.
 * `adapter` - approach how raw output will be converted to representation of dataset problem, some adapters can be specific to framework. You can find detailed instruction how to use adapters [here](../adapters/README.md).
+* `execution_providers` - list of execution providers for evaluation, e.g. [OpenVINO Execution Provider](https://github.com/microsoft/onnxruntime/blob/master/docs/execution_providers/OpenVINO-ExecutionProvider.md). Optional, [`CPUExecutionProvider`] is used by default.
+
+**Note: execution providers are available only in recent versions of ONNX Runtime. If your installed version does not support this API, please update it or do not specify this field.**
+
 
 # Specifying model inputs in config.
 
@@ -15,9 +19,10 @@ Each input description should has following info:
     * `CONST_INPUT` - input will be filled using constant provided in config. It also requires to provide `value`.
     * `IMAGE_INFO` - specific key for setting information about input shape to layer (used in Faster RCNN based topologies). You do not need provide `value`, because it will be calculated in runtime. Format value is `Nx[H, W, S]`, where `N` is batch size, `H` - original image height, `W` - original image width, `S` - scale of original image (default 1).
     * `INPUT` - network input for main data stream (e. g. images). If you have several data inputs, you should provide regular expression for identifier as `value` for specifying which one data should be provided in specific input.
-    Optionally you can determine `shape` of input (actually does not used, ONNX Runtime launcher uses info given from network) and `layout` in case when your model was trained with non-standard data layout (For ONNX Runtime default layout is `NCHW`).
+    Optionally you can determine `shape` of input (it is not actually used, ONNX Runtime launcher uses info given from network), `layout` in case when your model was trained with non-standard data layout (For ONNX Runtime default layout is `NCHW`)
+    and `precision` (Supported precisions: `FP32` - float, `FP16` - signed short, `U8` - unsigned char, `U16` - unsigned short int, `I8` - signed char, `I16` - short int, `I32` - int, `I64` - long int).
 
-MxNet launcher config example:
+ONNX Runtime launcher config example:
 
 ```yml
 launchers:
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/opencv_launcher.py b/tools/accuracy_checker/accuracy_checker/launcher/opencv_launcher.py
index 5c616f8492b..2655d67d9c6 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/opencv_launcher.py
+++ b/tools/accuracy_checker/accuracy_checker/launcher/opencv_launcher.py
@@ -30,11 +30,13 @@
 
 class OpenCVLauncherConfigValidator(LauncherConfigValidator):
     def validate(self, entry, field_uri=None):
+        self.fields['inputs'].optional = self.delayed_model_loading
         super().validate(entry, field_uri)
-        inputs = entry.get('inputs')
-        for input_layer in inputs:
-            if 'shape' not in input_layer:
-                raise ConfigError('input value should have shape field')
+        if not self.delayed_model_loading:
+            inputs = entry.get('inputs')
+            for input_layer in inputs:
+                if 'shape' not in input_layer:
+                    raise ConfigError('input value should have shape field')
 
 
 class OpenCVLauncher(Launcher):
@@ -75,22 +77,16 @@ def parameters(cls):
 
     def __init__(self, config_entry: dict, *args, **kwargs):
         super().__init__(config_entry, *args, **kwargs)
+        self._delayed_model_loading = kwargs.get('delayed_model_loading', False)
 
-        opencv_launcher_config = OpenCVLauncherConfigValidator('OpenCV_Launcher', fields=self.parameters())
+        opencv_launcher_config = OpenCVLauncherConfigValidator(
+            'OpenCV_Launcher', fields=self.parameters(), delayed_model_loading=self._delayed_model_loading
+        )
         opencv_launcher_config.validate(self.config)
-
-        self.model = str(self.get_value_from_config('model'))
-        self.weights = str(self.get_value_from_config('weights'))
-
-        self.network = cv2.dnn.readNet(self.model, self.weights)
-
         match = re.match(BACKEND_REGEX, self.get_value_from_config('backend').lower())
         selected_backend = match.group('backend')
         print_info('backend: {}'.format(selected_backend))
-        backend = OpenCVLauncher.OPENCV_BACKENDS.get(selected_backend)
-
-        self.network.setPreferableBackend(backend)
-
+        self.backend = OpenCVLauncher.OPENCV_BACKENDS.get(selected_backend)
         match = re.match(DEVICE_REGEX, self.get_value_from_config('device').lower())
         selected_device = match.group('device')
 
@@ -99,21 +95,18 @@ def __init__(self, config_entry: dict, *args, **kwargs):
             if ('FP16' in tags) and (selected_device == 'gpu'):
                 selected_device = 'gpu_fp16'
 
-        target = OpenCVLauncher.TARGET_DEVICES.get(selected_device)
+        self.target = OpenCVLauncher.TARGET_DEVICES.get(selected_device)
 
-        if target is None:
+        if self.target is None:
             raise ConfigError('{} is not supported device'.format(selected_device))
 
-        self.network.setPreferableTarget(target)
-
-        inputs = self.config['inputs']
-
-        def parse_shape_value(shape):
-            return tuple([1, *[int(elem) for elem in get_or_parse_value(shape, ())]])
-
-        self._inputs_shapes = OrderedDict({elem.get('name'): parse_shape_value(elem.get('shape')) for elem in inputs})
-        self.network.setInputsNames(list(self._inputs_shapes.keys()))
-        self.output_names = self.network.getUnconnectedOutLayersNames()
+        if not self._delayed_model_loading:
+            self.model = self.get_value_from_config('model')
+            self.weights = self.get_value_from_config('weights')
+            self.network = self.create_network(self.model, self.weights)
+            self._inputs_shapes = self.get_inputs_from_config(self.config)
+            self.network.setInputsNames(list(self._inputs_shapes.keys()))
+            self.output_names = self.network.getUnconnectedOutLayersNames()
 
     @property
     def inputs(self):
@@ -144,9 +137,7 @@ def predict(self, inputs, metadata=None, **kwargs):
             for blob_name in self._inputs_shapes:
                 self.network.setInput(input_blobs[blob_name].astype(np.float32), blob_name)
             list_prediction = self.network.forward(self.output_names)
-            dict_result = {
-                output_name: output_value for output_name, output_value in zip(self.output_names, list_prediction)
-            }
+            dict_result = dict(zip(self.output_names, list_prediction))
             results.append(dict_result)
 
         if metadata is not None:
@@ -158,6 +149,24 @@ def predict(self, inputs, metadata=None, **kwargs):
     def predict_async(self, *args, **kwargs):
         raise ValueError('OpenCV Launcher does not support async mode yet')
 
+    def create_network(self, model, weights):
+        network = cv2.dnn.readNet(str(model), str(weights))
+        network.setPreferableBackend(self.backend)
+        network.setPreferableTarget(self.target)
+
+        return network
+
+    @staticmethod
+    def get_inputs_from_config(config):
+        inputs = config.get('inputs')
+        if not inputs:
+            raise ConfigError('inputs should be provided in config')
+
+        def parse_shape_value(shape):
+            return tuple([1, *[int(elem) for elem in get_or_parse_value(shape, ())]])
+
+        return OrderedDict([(elem.get('name'), parse_shape_value(elem.get('shape'))) for elem in inputs])
+
     def release(self):
         """
         Releases launcher.
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/opencv_launcher_readme.md b/tools/accuracy_checker/accuracy_checker/launcher/opencv_launcher_readme.md
index 518d9261e60..e498a494981 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/opencv_launcher_readme.md
+++ b/tools/accuracy_checker/accuracy_checker/launcher/opencv_launcher_readme.md
@@ -16,7 +16,7 @@ Each input description should has following info:
     * `IMAGE_INFO` - specific key for setting information about input shape to layer (used in Faster RCNN based topologies). You do not need provide `value`, because it will be calculated in runtime. Format value is `Nx[H, W, S]`, where `N` is batch size, `H` - original image height, `W` - original image width, `S` - scale of original image (default 1).
     * `INPUT` - network input for main data stream (e. g. images). If you have several data inputs, you should provide regular expression for identifier as `value` for specifying which one data should be provided in specific input.
   * `shape` - shape of input layer described as comma-separated of all dimensions size except batch size. 
-    Optionally you can determine `layout` in case when your model was trained with non-standard data layout (For OpenCV default layout is `NCHW`).
+    Optionally you can determine `layout` in case when your model was trained with non-standard data layout (For OpenCV default layout is `NCHW`) and `precision` (Supported precisions: `FP32` - float, `FP16` - signed short, `U8` - unsigned char, `U16` - unsigned short int, `I8` - signed char, `I16` - short int, `I32` - int, `I64` - long int).
 
 OpenCV launcher config example:
 
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/pytorch_launcher.py b/tools/accuracy_checker/accuracy_checker/launcher/pytorch_launcher.py
new file mode 100644
index 00000000000..da7f6da5e44
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/launcher/pytorch_launcher.py
@@ -0,0 +1,147 @@
+from contextlib import contextmanager
+import sys
+import importlib
+from collections import OrderedDict
+
+import numpy as np
+from ..config import PathField, StringField, DictField, NumberField, ListField
+from .launcher import Launcher, LauncherConfigValidator
+
+MODULE_REGEX = r'(?:\w+)(?:(?:.\w+)*)'
+DEVICE_REGEX = r'(?P<device>cpu$|cuda)?'
+
+
+class PyTorchLauncher(Launcher):
+    __provider__ = 'pytorch'
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'module': StringField(regex=MODULE_REGEX, description='Network module for loading'),
+            'checkpoint': PathField(
+                check_exists=True, is_directory=False, optional=True, description='pre-trained model checkpoint'
+            ),
+            'python_path': PathField(
+                check_exists=True, is_directory=True, optional=True,
+                description='appendix for PYTHONPATH for making network module visible in current python environment'
+            ),
+            'module_args': ListField(optional=True, description='positional arguments for network module'),
+            'module_kwargs':  DictField(
+                key_type=str, validate_values=False, optional=True, default={},
+                description='keyword arguments for network module'
+            ),
+            'device': StringField(default='cpu', regex=DEVICE_REGEX),
+            'batch': NumberField(value_type=float, min_value=1, optional=True, description="Batch size.", default=1),
+            'output_names': ListField(
+                optional=True, value_type=str, description='output tensor names'
+            )
+        })
+        return parameters
+
+    def __init__(self, config_entry: dict, *args, **kwargs):
+        super().__init__(config_entry, *args, **kwargs)
+        try:
+            # PyTorch import affects performance of common pipeline
+            # it is the reason, why it is imported only when it used
+            import torch # pylint: disable=C0415
+        except ImportError as import_error:
+            raise ValueError("PyTorch isn't installed. Please, install it before using. \n{}".format(import_error.msg))
+        self._torch = torch
+        pytorch_launcher_config = LauncherConfigValidator('Pytorch_Launcher', fields=self.parameters())
+        pytorch_launcher_config.validate(self.config)
+        module_args = config_entry.get("module_args", ())
+        module_kwargs = config_entry.get("module_kwargs", {})
+        self.cuda = 'cuda' in self.get_value_from_config('device')
+        self.module = self.load_module(
+            config_entry['module'],
+            module_args,
+            module_kwargs,
+            config_entry.get('checkpoint'),
+            config_entry.get('state_key'),
+            config_entry.get("python_path")
+        )
+
+        self._batch = self.get_value_from_config('batch')
+        # torch modules does not have input information
+        self._generate_inputs()
+        self.output_names = self.get_value_from_config('output_names') or ['output']
+
+    def _generate_inputs(self):
+        config_inputs = self.config.get('inputs')
+        if not config_inputs:
+            self._inputs = {'input': (self.batch, ) + (-1, ) * 3}
+            return
+        input_shapes = OrderedDict()
+        for input_description in config_inputs:
+            input_shapes[input_description['name']] = input_description.get('shape', (self.batch, ) + (-1, ) * 3)
+        self._inputs = input_shapes
+
+    @property
+    def inputs(self):
+        return self._inputs
+
+    @property
+    def batch(self):
+        return self._batch
+
+    @property
+    def output_blob(self):
+        return next(iter(self.output_names))
+
+    def load_module(self, model_cls, module_args, module_kwargs, checkpoint=None, state_key=None, python_path=None):
+        module_parts = model_cls.split(".")
+        model_cls = module_parts[-1]
+        model_path = ".".join(module_parts[:-1])
+        with append_to_path(python_path):
+            model_cls = importlib.import_module(model_path).__getattribute__(model_cls)
+            module = model_cls(*module_args, **module_kwargs)
+            if checkpoint:
+                checkpoint = self._torch.load(checkpoint)
+                state = checkpoint if not state_key else checkpoint[state_key]
+                module.load_state_dict(state, strict=False)
+            if self.cuda:
+                module.cuda()
+            else:
+                module.cpu()
+            module.eval()
+            return module
+
+    def fit_to_input(self, data, layer_name, layout, precision):
+        data = np.transpose(data, layout)
+        tensor = self._torch.from_numpy(data.astype(np.float32 if not precision else precision))
+        if self.cuda:
+            tensor = tensor.cuda()
+        with self._torch.no_grad():
+            return self._torch.autograd.Variable(tensor)
+
+    def predict(self, inputs, metadata=None, **kwargs):
+        results = []
+        for batch_input in inputs:
+            outputs = list(self.module(*batch_input.values()))
+            result_dict = {
+                output_name: res.data.cpu().numpy() if self.cuda else res.data.numpy()
+                for output_name, res in zip(self.output_names, outputs)
+            }
+            results.append(result_dict)
+            for meta_ in metadata:
+                meta_['input_shape'] = {key: list(data.shape) for key, data in batch_input.items()}
+
+        return results
+
+    def predict_async(self, *args, **kwargs):
+        raise ValueError('PyTorch Launcher does not support async mode yet')
+
+    def release(self):
+        del self.module
+
+
+@contextmanager
+def append_to_path(path):
+    if path:
+        sys.path.append(str(path))
+
+    yield
+
+    if path:
+        sys.path.remove(str(path))
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/pytorch_launcher_readme.md b/tools/accuracy_checker/accuracy_checker/launcher/pytorch_launcher_readme.md
new file mode 100644
index 00000000000..cdd2c49f46a
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/launcher/pytorch_launcher_readme.md
@@ -0,0 +1,36 @@
+# How to configure PyTorch launcher
+
+For enabling PyTorch launcher you need to add `framework: pytorch` in launchers section of your configuration file and provide following parameters:
+
+* `device` - specifies which device will be used for infer (`cpu`, `cuda` and so on).
+* `module` - PyTorch network module for loading.
+* `checkpoint` - pre-trained model checkpoint (Optional).
+* `python_path` - appendix for PYTHONPATH for making network module visible in current python environment (Optional).
+* `module_args` - list of positional arguments for network module (Optional).
+* `module_kwargs` - dictionary (`key`: `value` where `key` is argument name, `value` is argument value) which represents network module keyword arguments (Optional).
+* `adapter` - approach how raw output will be converted to representation of dataset problem, some adapters can be specific to framework. You can find detailed instruction how to use adapters [here](../adapters/README.md).
+* `batch` - batch size for running model (Optional, default 1).
+In turn, if your model has several inputs, you need to specify them in the config using the specific parameter `inputs`.
+Each input description should have the following info:
+  * `name` - input layer name in network
+  * `type` - type of input values, it has impact on filling policy. Available options:
+    * `CONST_INPUT` - input will be filled using constant provided in config. It also requires to provide `value`.
+    * `IMAGE_INFO` - specific key for setting information about input shape to layer (used in Faster RCNN based topologies). You do not need provide `value`, because it will be calculated in runtime. Format value is `Nx[H, W, S]`, where `N` is batch size, `H` - original image height, `W` - original image width, `S` - scale of original image (default 1).
+    * `INPUT` - network input for main data stream (e. g. images). If you have several data inputs, you should provide regular expression for identifier as `value` for specifying which one data should be provided in specific input.
+  * `shape` - shape of input layer described as comma-separated of all dimensions size except batch size.
+    Optionally you can determine `layout` in case when your model was trained with non-standard data layout (For PyTorch default layout is `NCHW`) and `precision` (Supported precisions: `FP32` - float, `FP16` - signed short, `U8` - unsigned char, `U16` - unsigned short int, `I8` - signed char, `I16` - short int, `I32` - int, `I64` - long int).
+If your model has several outputs, you also need to specify their names in the config using the `output_names` option, so that their values can be accessed in the adapter.
+
+PyTorch launcher config example (demonstrates how to run AlexNet model from [torchvision](https://pytorch.org/docs/stable/torchvision/models.html)):
+
+```yml
+launchers:
+  - framework: pytorch
+    device: CPU
+    module: torchvision.models.alexnet
+
+    module_kwargs:
+      pretrained: True
+
+    adapter: classification
+```
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/tf_launcher.py b/tools/accuracy_checker/accuracy_checker/launcher/tf_launcher.py
index f41e9aad8a7..45aee68cd7c 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/tf_launcher.py
+++ b/tools/accuracy_checker/accuracy_checker/launcher/tf_launcher.py
@@ -17,9 +17,10 @@
 import re
 from pathlib import Path
 import tensorflow as tf
-
-from .launcher import Launcher
-from ..config import BaseField, ListField, PathField, StringField, ConfigError, ConfigValidator
+from tensorflow.python.saved_model import tag_constants
+from .launcher import Launcher, LauncherConfigValidator
+from ..config import BaseField, ListField, PathField, StringField, ConfigError
+from ..utils import contains_any, contains_all
 
 
 class TFLauncher(Launcher):
@@ -29,7 +30,10 @@ class TFLauncher(Launcher):
     def parameters(cls):
         parameters = super().parameters()
         parameters.update({
-            'model': PathField(is_directory=False, description="Path to model file."),
+            'model': PathField(
+                is_directory=False, description="Path to model file (frozen graph of checkpoint meta).", optional=True
+            ),
+            'saved_model_dir': PathField(is_directory=True, optional=True, description='Path to saved model directory'),
             'device': StringField(
                 choices=('cpu', 'gpu'), default='cpu', optional=True, description="Device name: cpu or gpu"),
             'inputs': BaseField(optional=True, description="Inputs."),
@@ -42,27 +46,40 @@ def parameters(cls):
     def __init__(self, config_entry, *args, **kwargs):
         super().__init__(config_entry, *args, **kwargs)
         self.default_layout = 'NHWC'
+        self._delayed_model_loading = kwargs.get('delayed_model_loading', False)
 
-        tf_launcher_config = ConfigValidator('TF_Launcher', fields=self.parameters())
+        tf_launcher_config = LauncherConfigValidator(
+            'TF_Launcher', fields=self.parameters(), delayed_model_loading=self._delayed_model_loading
+        )
         tf_launcher_config.validate(self.config)
-        self._config_outputs = self.get_value_from_config('output_names')
 
-        self._graph = self._load_graph(str(self.get_value_from_config('model')))
+        if not self._delayed_model_loading:
+            if not contains_any(self.config, ['model', 'saved_model_dir']):
+                raise ConfigError('model or saved model directory should be provided')
+
+            if contains_all(self.config, ['model', 'saved_model']):
+                raise ConfigError('only one option: model or saved_model_dir should be provided')
 
-        self._outputs_names = self._get_outputs_names(self._graph, self._config_outputs)
+            self._config_outputs = self.get_value_from_config('output_names')
+            if 'model' in self.config:
+                self._graph = self._load_graph(str(self.get_value_from_config('model')))
+            else:
+                self._graph = self._load_graph(str(self.get_value_from_config('saved_model_dir')), True)
 
-        self._outputs_tensors = []
-        self.node_pattern = 'import/{}:0'
-        for output in self._outputs_names:
-            try:
-                tensor = self._graph.get_tensor_by_name('import/{}:0'.format(output))
-            except KeyError:
+            self._outputs_names = self._get_outputs_names(self._graph, self._config_outputs)
+
+            self._outputs_tensors = []
+            self.node_pattern = 'import/{}:0'
+            for output in self._outputs_names:
                 try:
-                    tensor = self._graph.get_tensor_by_name('{}:0'.format(output))
-                    self.node_pattern = '{}:0'
+                    tensor = self._graph.get_tensor_by_name('import/{}:0'.format(output))
                 except KeyError:
-                    raise ConfigError('model graph does not contains output {}'.format(output))
-            self._outputs_tensors.append(tensor)
+                    try:
+                        tensor = self._graph.get_tensor_by_name('{}:0'.format(output))
+                        self.node_pattern = '{}:0'
+                    except KeyError:
+                        raise ConfigError('model graph does not contains output {}'.format(output))
+                self._outputs_tensors.append(tensor)
 
         self.device = '/{}:0'.format(self.get_value_from_config('device').lower())
 
@@ -113,18 +130,14 @@ def output_blob(self):
     def predict_async(self, *args, **kwargs):
         raise ValueError('TensorFlow Launcher does not support async mode yet')
 
-    def _load_graph(self, model):
+    def _load_graph(self, model, saved_model=False):
+        if saved_model:
+            return self._load_saved_model(model)
+
         if 'meta' in Path(model).suffix:
             return self._load_graph_using_meta(model)
 
-        with tf.gfile.GFile(model, 'rb') as file:
-            graph_def = tf.GraphDef()
-            graph_def.ParseFromString(file.read())
-
-        with tf.Graph().as_default() as graph:
-            tf.import_graph_def(graph_def)
-
-        return graph
+        return self._load_frozen_graph(model)
 
     def _load_graph_using_meta(self, model):
         tf.reset_default_graph()
@@ -145,6 +158,27 @@ def _load_graph_using_meta(self, model):
             tf.import_graph_def(graph_def, name='')
         return graph
 
+    @staticmethod
+    def _load_frozen_graph(model):
+        with tf.gfile.GFile(model, 'rb') as file:
+            graph_def = tf.GraphDef()
+            graph_def.ParseFromString(file.read())
+
+        with tf.Graph().as_default() as graph:
+            tf.import_graph_def(graph_def)
+
+        return graph
+
+    @staticmethod
+    def _load_saved_model(model_dir):
+        graph = tf.Graph()
+
+        with graph.as_default():
+            with tf.Session() as sess:
+                tf.saved_model.loader.load(sess, [tag_constants.SERVING], model_dir)
+
+        return graph
+
     def _get_graph_inputs(self, graph, config_inputs=None):
         inputs_ops = {'Placeholder'}
         inputs = [x for x in graph.as_graph_def().node if not x.input and x.op in inputs_ops]
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/tf_launcher_readme.md b/tools/accuracy_checker/accuracy_checker/launcher/tf_launcher_readme.md
index 640d2a83351..3a7ab908773 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/tf_launcher_readme.md
+++ b/tools/accuracy_checker/accuracy_checker/launcher/tf_launcher_readme.md
@@ -16,7 +16,8 @@ Each input description should has following info:
     * `CONST_INPUT` - input will be filled using constant provided in config. It also requires to provide `value`.
     * `IMAGE_INFO` - specific key for setting information about input shape to layer (used in Faster RCNN based topologies). You do not need provide `value`, because it will be calculated in runtime. Format value is `Nx[H, W, S]`, where `N` is batch size, `H` - original image height, `W` - original image width, `S` - scale of original image (default 1).
     * `INPUT` - network input for main data stream (e. g. images). If you have several data inputs, you should provide regular expression for identifier as `value` for specifying which one data should be provided in specific input.
-    Optionally you can determine `shape` of input and `layout` in case when your model was trained with non-standard data layout (For TensorFlow default layout is `NHWC`).
+    Optionally you can determine `shape` of input and `layout` in case when your model was trained with non-standard data layout (For TensorFlow default layout is `NHWC`)
+    and `precision` (Supported precisions: `FP32` - float, `FP16` - signed short, `U8` - unsigned char, `U16` - unsigned short int, `I8` - signed char, `I16` - short int, `I32` - int, `I64` - long int).
 
 TensorFlow launcher config example:
 
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/tf_lite_launcher.py b/tools/accuracy_checker/accuracy_checker/launcher/tf_lite_launcher.py
index e084f4a950b..84b17bb1f4b 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/tf_lite_launcher.py
+++ b/tools/accuracy_checker/accuracy_checker/launcher/tf_lite_launcher.py
@@ -15,10 +15,14 @@
 """
 
 import tensorflow as tf
-
 from .launcher import Launcher, LauncherConfigValidator, ListInputsField
 from ..config import PathField, StringField
 
+try:
+    tf_lite = tf.lite
+except AttributeError:
+    tf_lite = tf.contrib.lite
+
 
 class TFLiteLauncher(Launcher):
     __provider__ = 'tf_lite'
@@ -33,21 +37,24 @@ def parameters(cls):
         })
         return parameters
 
-    def __init__(self, config_entry, adapter, *args, **kwargs):
-        super().__init__(config_entry, adapter, *args, **kwargs)
+    def __init__(self, config_entry, *args, **kwargs):
+        super().__init__(config_entry, *args, **kwargs)
         self.default_layout = 'NHWC'
+        self._delayed_model_loading = kwargs.get('delayed_model_loading', False)
 
-        tf_launcher_config = LauncherConfigValidator('TF_Lite_Launcher', fields=self.parameters())
+        tf_launcher_config = LauncherConfigValidator(
+            'TF_Lite_Launcher', fields=self.parameters(), delayed_model_loading=self._delayed_model_loading
+        )
         tf_launcher_config.validate(self.config)
-
-        self._interpreter = tf.contrib.lite.Interpreter(model_path=str(self.config['model']))
-        self._interpreter.allocate_tensors()
-        self._input_details = self._interpreter.get_input_details()
-        self._output_details = self._interpreter.get_output_details()
-        self._inputs = {input_layer['name']: input_layer for input_layer in self._input_details}
+        if not self._delayed_model_loading:
+            self._interpreter = tf_lite.Interpreter(model_path=str(self.config['model']))
+            self._interpreter.allocate_tensors()
+            self._input_details = self._interpreter.get_input_details()
+            self._output_details = self._interpreter.get_output_details()
+            self._inputs = {input_layer['name']: input_layer for input_layer in self._input_details}
         self.device = '/{}:0'.format(self.config.get('device', 'cpu').lower())
 
-    def predict(self, inputs, metadata, *args, **kwargs):
+    def predict(self, inputs, metadata=None, **kwargs):
         """
         Args:
             inputs: dictionary where keys are input layers names and values are data for them.
@@ -64,6 +71,10 @@ def predict(self, inputs, metadata, *args, **kwargs):
             res = {output['name']: self._interpreter.get_tensor(output['index']) for output in self._output_details}
             results.append(res)
 
+            if metadata is not None:
+                for meta_ in metadata:
+                    meta_['input_shape'] = self.inputs_info_for_meta()
+
         return results
 
     @property
@@ -72,13 +83,13 @@ def batch(self):
 
     @property
     def inputs(self):
-        return self._inputs.items()
+        return self._inputs
 
     def release(self):
         del self._interpreter
 
     def predict_async(self, *args, **kwargs):
-        raise ValueError('Tensorflow Lite Launcher does not support async mode yet')
+        raise ValueError('TensorFlow Lite Launcher does not support async mode yet')
 
     @property
     def output_blob(self):
diff --git a/tools/accuracy_checker/accuracy_checker/launcher/tf_lite_launcher_readme.md b/tools/accuracy_checker/accuracy_checker/launcher/tf_lite_launcher_readme.md
index 4e96147a393..a6c50982269 100644
--- a/tools/accuracy_checker/accuracy_checker/launcher/tf_lite_launcher_readme.md
+++ b/tools/accuracy_checker/accuracy_checker/launcher/tf_lite_launcher_readme.md
@@ -15,7 +15,8 @@ Each input description should has following info:
     * `CONST_INPUT` - input will be filled using constant provided in config. It also requires to provide `value`.
     * `IMAGE_INFO` - specific key for setting information about input shape to layer (used in Faster RCNN based topologies). You do not need provide `value`, because it will be calculated in runtime. Format value is `Nx[H, W, S]`, where `N` is batch size, `H` - original image height, `W` - original image width, `S` - scale of original image (default 1).
     * `INPUT` - network input for main data stream (e. g. images). If you have several data inputs, you should provide regular expression for identifier as `value` for specifying which one data should be provided in specific input.
-    Optionally you can determine `shape` of input and `layout` in case when your model was trained with non-standard data layout (For TensorFlow Lite default layout is `NHWC`).
+    Optionally you can determine `shape` of input and `layout` in case when your model was trained with non-standard data layout (For TensorFlow Lite default layout is `NHWC`)
+    and `precision` (Supported precisions: `FP32` - float, `FP16` - signed short, `U8` - unsigned char, `U16` - unsigned short int, `I8` - signed char, `I16` - short int, `I32` - int, `I64` - long int).
 
 TensorFlow Lite launcher config example:
 
diff --git a/tools/accuracy_checker/accuracy_checker/logging.py b/tools/accuracy_checker/accuracy_checker/logging.py
index dcc80ce268a..19f4762fa3b 100644
--- a/tools/accuracy_checker/accuracy_checker/logging.py
+++ b/tools/accuracy_checker/accuracy_checker/logging.py
@@ -102,6 +102,10 @@ def error(msg, *args, **kwargs):
     _default_logger.error(msg, *args, **kwargs)
 
 
+def exception(exc, *args, **kwargs):
+    _default_logger.exception(str(exc), *args, **kwargs)
+
+
 def warning(msg, *args, raise_warning=True, **kwargs):
     if raise_warning:
         warnings.warn(msg)
diff --git a/tools/accuracy_checker/accuracy_checker/main.py b/tools/accuracy_checker/accuracy_checker/main.py
index c50fd7c6994..a2bde722acc 100644
--- a/tools/accuracy_checker/accuracy_checker/main.py
+++ b/tools/accuracy_checker/accuracy_checker/main.py
@@ -14,6 +14,7 @@
 limitations under the License.
 """
 
+import sys
 from pathlib import Path
 from argparse import ArgumentParser
 from functools import partial
@@ -21,11 +22,17 @@
 import cv2
 
 from .config import ConfigReader
-from .logging import print_info, add_file_handler
-from .evaluators import ModelEvaluator, PipeLineEvaluator, get_processing_info
+from .logging import print_info, add_file_handler, exception
+from .evaluators import ModelEvaluator, PipeLineEvaluator, ModuleEvaluator
 from .progress_reporters import ProgressReporter
 from .utils import get_path, cast_to_bool
 
+EVALUATION_MODE = {
+    'models': ModelEvaluator,
+    'pipelines': PipeLineEvaluator,
+    'evaluations': ModuleEvaluator
+}
+
 
 def build_arguments_parser():
     parser = ArgumentParser(description='Deep Learning accuracy validation framework', allow_abbrev=False)
@@ -45,21 +52,18 @@ def build_arguments_parser():
         '-m', '--models',
         help='prefix path to the models and weights',
         type=partial(get_path, is_directory=True),
-        default=Path.cwd(),
         required=False
     )
     parser.add_argument(
         '-s', '--source',
         help='prefix path to the data source',
         type=partial(get_path, is_directory=True),
-        default=Path.cwd(),
         required=False
     )
     parser.add_argument(
         '-a', '--annotations',
         help='prefix path to the converted annotations and datasets meta data',
         type=partial(get_path, is_directory=True),
-        default=Path.cwd(),
         required=False
     )
     parser.add_argument(
@@ -79,7 +83,6 @@ def build_arguments_parser():
         '-b', '--bitstreams',
         help='prefix path to bitstreams folder',
         type=partial(get_path, file_or_directory=True),
-        default=Path.cwd(),
         required=False
     )
     parser.add_argument(
@@ -111,6 +114,14 @@ def build_arguments_parser():
         # defined in model_conversion.py
         required=False
     )
+    parser.add_argument(
+        '--transformations_config_dir',
+        help='path to directory with Model Optimizer transformations configuration files',
+        type=partial(get_path, is_directory=True),
+        # there is no default value because if user did not specify it we use specific location
+        # defined in model_conversion.py
+        required=False
+    )
     parser.add_argument(
         '--tf_obj_detection_api_pipeline_config_path',
         help='path to directory with tensorflow object detection api pipeline configuration files for model optimizer',
@@ -186,11 +197,19 @@ def build_arguments_parser():
         choices=['LOG_NONE', 'LOG_WARNING', 'LOG_INFO', 'LOG_DEBUG'],
         default='LOG_WARNING'
     )
+    parser.add_argument(
+        '--deprecated_ir_v7',
+        help='Allow generation IR v7 via Model Optimizer',
+        required=False,
+        default=False,
+        type=cast_to_bool
+    )
 
     return parser
 
 
 def main():
+    return_code = 0
     args = build_arguments_parser().parse_args()
     progress_bar_provider = args.progress if ':' not in args.progress else args.progress.split(':')[0]
     progress_reporter = ProgressReporter.provide(progress_bar_provider, None, print_interval=args.progress_interval)
@@ -198,39 +217,22 @@ def main():
         add_file_handler(args.log_file)
 
     config, mode = ConfigReader.merge(args)
-    if mode == 'models':
-        model_evaluation_mode(config, progress_reporter, args)
-    else:
-        pipeline_evaluation_mode(config, progress_reporter, args)
-
-
-def model_evaluation_mode(config, progress_reporter, args):
-    for model in config['models']:
-        for launcher_config in model['launchers']:
-            for dataset_config in model['datasets']:
-                print_processing_info(
-                    model['name'],
-                    launcher_config['framework'],
-                    launcher_config['device'],
-                    launcher_config.get('tags'),
-                    dataset_config['name']
-                )
-                model_evaluator = ModelEvaluator.from_configs(launcher_config, dataset_config)
-                progress_reporter.reset(model_evaluator.dataset.size)
-                model_evaluator.dataset_processor(args.stored_predictions, progress_reporter=progress_reporter)
-                model_evaluator.compute_metrics(ignore_results_formatting=args.ignore_result_formatting)
-
-                model_evaluator.release()
-
-
-def pipeline_evaluation_mode(config, progress_reporter, args):
-    for pipeline_config in config['pipelines']:
-        print_processing_info(*get_processing_info(pipeline_config))
-        evaluator = PipeLineEvaluator.from_configs(pipeline_config['stages'])
-        evaluator.process_dataset(args.stored_predictions, progress_reporter=progress_reporter)
-        evaluator.compute_metrics(ignore_results_formatting=args.ignore_result_formatting)
-
-        evaluator.release()
+    evaluator_class = EVALUATION_MODE.get(mode)
+    if not evaluator_class:
+        raise ValueError('Unknown evaluation mode')
+    for config_entry in config[mode]:
+        try:
+            processing_info = evaluator_class.get_processing_info(config_entry)
+            print_processing_info(*processing_info)
+            evaluator = evaluator_class.from_configs(config_entry)
+            evaluator.process_dataset(args.stored_predictions, progress_reporter=progress_reporter)
+            evaluator.compute_metrics(ignore_results_formatting=args.ignore_result_formatting)
+            evaluator.release()
+        except Exception as e:  # pylint:disable=W0703
+            exception(e)
+            return_code = 1
+            continue
+    sys.exit(return_code)
 
 
 def print_processing_info(model, launcher, device, tags, dataset):
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/README.md b/tools/accuracy_checker/accuracy_checker/metrics/README.md
index b87de8f67f9..7a80e8b0a74 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/README.md
+++ b/tools/accuracy_checker/accuracy_checker/metrics/README.md
@@ -1,24 +1,27 @@
 # Metrics
 
-For correct work metrics require specific representation format. 
-(e. g. map expects detection annotation and detection prediction for evaluation). 
+For correct work metrics require specific representation format.
+(e. g. map expects detection annotation and detection prediction for evaluation).
 
 In case when you use complicated representation located in representation container, you need to add options `annotation_source` and `prediction_source` in configuration file to
 select specific representation, another way metric calculation possible only if container has only one suitable representation and will be resolved automatically.
 `annotation_source` and `prediction_source` should contain only one annotation identifier and output layer name respectively.
 You may optionally provide `reference` field for metric, if you want calculated metric tested against specific value (i.e. reported in canonical paper) and acceptable `threshold` for metric deviation from reference value.
 
-Every metric has parameters available for configuration. 
+Every metric has parameters available for configuration.
 
 Accuracy Checker supports following set of metrics:
 
 * `accuracy` - classification accuracy metric, defined as the number of correct predictions divided by the total number of predictions.
-Supported representation: `ClassificationAnnotation`, `ClassificationPrediction`
+Supported representation: `ClassificationAnnotation`, `TextClassificationAnnotation`, `ClassificationPrediction`.
   * `top_k` - the number of classes with the highest probability, which will be used to decide if prediction is correct.
 * `accuracy_per_class` - classification accuracy metric which represents results for each class. Supported representation: `ClassificationAnnotation`, `ClassificationPrediction`.
   * `top_k` - the number of classes with the highest probability, which will be used to decide if prediction is correct.
-  * `label_map` - the field in annotation metadata, which contains dataset label map.
+  * `label_map` - the field in annotation metadata, which contains dataset label map (Optional, should be provided if different from default).
 * `character_recognition_accuracy` - accuracy metric for character recognition task. Supported representation: `CharacterRecognitionAnnotation`, `CharacterRecognitionPrediction`.
+* `classification_f1-score` - [F1 score](https://en.wikipedia.org/wiki/F1_score) metric for classification task. Supported representation: `ClassificationAnnotation`, `TextClassificationAnnotation`, `ClassificationPrediction`.
+  * `label_map` - the field in annotation metadata, which contains dataset label map (Optional, should be provided if different from default).
+* `metthews_correlation_coef` - [Matthews correlation coefficient (MCC)](https://en.wikipedia.org/wiki/Matthews_correlation_coefficient) for binary classification. Supported representation: `ClassificationAnnotation`, `TextClassificationAnnotation`, `ClassificationPrediction`.
 * `map` - mean average precision. Supported representations: `DetectionAnnotation`, `DetectionPrediction`.
   * `overlap_threshold` - minimal value for intersection over union that allows to make decision that prediction bounding box is true positive.
   * `overlap_method` - method for calculation bbox overlap. You can choose between intersection over union (`iou`), defined as area of intersection divided by union of annotation and prediction boxes areas, and intersection over area (`ioa`), defined as area of intersection divided by ara of prediction box.
@@ -26,7 +29,7 @@ Supported representation: `ClassificationAnnotation`, `ClassificationPrediction`
   * `ignore_difficult` - allows to ignore difficult annotation boxes in metric calculation. In this case, difficult boxes are filtered annotations from postprocessing stage.
   * `distinct_conf` - select only values for distinct confidences.
   * `allow_multiple_matches_per_ignored` - allows multiple matches per ignored.
-  * `label_map` - the field in annotation metadata, which contains dataset label map.
+  * `label_map` - the field in annotation metadata, which contains dataset label map (Optional, should be provided if different from default).
   * `integral` - integral type for average precision calculation. Pascal VOC `11point` and `max` approaches are available.
 * `miss_rate` - miss rate metric of detection models.  Supported representations: `DetectionAnnotation`, `DetectionPrediction`.
   * `overlap_threshold` - minimal value for intersection over union that allows to make decision that prediction bounding box is true positive.
@@ -35,7 +38,7 @@ Supported representation: `ClassificationAnnotation`, `ClassificationPrediction`
   * `ignore_difficult` - allows to ignore difficult annotation boxes in metric calculation. In this case, difficult boxes are filtered annotations from postprocessing stage.
   * `distinct_conf` - select only values for distinct confidences.
   * `allow_multiple_matches_per_ignored` - allows multiple matches per ignored.
-  * `label_map` - the field in annotation metadata, which contains dataset label map.
+  * `label_map` - the field in annotation metadata, which contains dataset label map (Optional, should be provided if different from default).
   * `fppi_level` - false positive per image level.
 * `recall` - recall metric of detection models. Supported representations: `DetectionAnnotation`, `DetectionPrediction`.
   * `overlap_threshold` - minimal value for intersection over union that allows to make decision that prediction bounding box is true positive.
@@ -44,12 +47,12 @@ Supported representation: `ClassificationAnnotation`, `ClassificationPrediction`
   * `ignore_difficult` - allows to ignore difficult annotation boxes in metric calculation. In this case, difficult boxes are filtered annotations from postprocessing stage.
   * `distinct_conf` - select only values for distinct confidences.
   * `allow_multiple_matches_per_ignored` - allows multiple matches per ignored.
-  * `label_map` - the field in annotation metadata, which contains dataset label map.
+  * `label_map` - the field in annotation metadata, which contains dataset label map (Optional, should be provided if different from default).
 * `detection_accuracy` - accuracy for detection models. Supported representations: `DetectionAnnotation`, `DetectionPrediction`.
   * `overlap_threshold` - minimal value for intersection over union that allows to make decision that prediction bounding box is true positive.
   * `overlap_method` - method for calculation bbox overlap. You can choose between intersection over union (`iou`), defined as area of intersection divided by union of annotation and prediction boxes areas, and intersection over area (`ioa`), defined as area of intersection divided by ara of prediction box.
   * `include_boundaries` - allows include boundaries in overlap calculation process. If it is True then width and height of box is calculated by max - min + 1.
-  * `label_map` - the field in annotation metadata, which contains dataset label map.
+  * `label_map` - the field in annotation metadata, which contains dataset label map (Optional, should be provided if different from default).
   * `use_normalization` - allows to normalize confusion_matrix for metric calculation.
 * `segmentation_accuracy` - pixel accuracy for semantic segmentation models. Supported representations: `SegmentationAnnotation`, `SegmentationPrediction`.
   * `use_argmax` - allows to use argmax for prediction mask.
@@ -71,7 +74,7 @@ More detailed information about calculation segmentation metrics you can find [h
 * `pairwise_accuracy` - pairwise accuracy for object reidentification. Supported representations: `ReIdentificationClassificationAnnotation`, `ReIdentificationPrediction`.
   * `min_score` - min score for determining that objects are different. You can provide value or use `train_median` value which will be calculated if annotations has training subset.
 * `pairwise_accuracy_subsets` - object reidentification pairwise accuracy with division dataset on test and train subsets for calculation mean score. Supported representations: `ReIdentificationClassificationAnnotation`, `ReIdentificationPrediction`.
-  * `subset_number` - number of subsets for separating. 
+  * `subset_number` - number of subsets for separating.
 * `mae` - [Mean Absolute Error](https://en.wikipedia.org/wiki/Mean_absolute_error). Supported representations: `RegressionAnnotation`, `RegressionPrediction`.
 * `mae_on_intervals` - Mean Absolute Error estimated magnitude for specific value range. Supported representations: `RegressionAnnotation`, `RegressionPrediction`.
   * `intervals` - comma-separated list of interval boundaries.
@@ -92,19 +95,19 @@ More detailed information about calculation segmentation metrics you can find [h
   * `calculate_std` - allows calculation of standard deviation (default value: `False`)
   * `percentile` - calculate error rate for given percentile.
 * `psnr` - [Peak signal to noise ratio](https://en.wikipedia.org/wiki/Peak_signal-to-noise_ratio). Supported representations: `SuperResolutionAnnotation`, `SuperResolutionPrediction`.
-  * `color_order` - the field specified which color order `BGR` or `RGB` will be used during metric calculation (Optional. Default value is RGB). 
+  * `color_order` - the field specified which color order `BGR` or `RGB` will be used during metric calculation (Optional. Default value is RGB).
 * `angle_error` - Mean angle error and Standard deviation of angle error for gaze estimation. Supported representations: `GazeVectorAnnotation`, `GazeVectorPrediction`.
 * `multi_accuracy` - accuracy for multilabel recognition task. Supported representations: `MultiLabelRecognitionAnnotation`, `MultiLabelRecognitionPrediction`.
-  * `label_map` - the field in annotation metadata, which contains dataset label map.
+  * `label_map` - the field in annotation metadata, which contains dataset label map (Optional, should be provided if different from default).
   * `calculate_average` - allows calculation of average accuracy (default value: `True`).
 * `multi_precision` - precision metric for multilabel recognition. Supported representations: `MultiLabelRecognitionAnnotation`, `MultiLabelRecognitionPrediction`.
-  * `label_map` - the field in annotation metadata, which contains dataset label map.
+  * `label_map` - the field in annotation metadata, which contains dataset label map (Optional, should be provided if different from default).
   * `calculate_average` - allows calculation of average precision (default value: `True`).
 * `multi_recall` - recall metric for multilabel recognition. Supported representations: `MultiLabelRecognitionAnnotation`, `MultiLabelRecognitionPrediction`.
-  * `label_map` - the field in annotation metadata, which contains dataset label map.
+  * `label_map` - the field in annotation metadata, which contains dataset label map (Optional, should be provided if different from default).
   * `calculate_average` - allows calculation of average recall (default value: `True`).
 * `f1_score` - [F score](https://en.wikipedia.org/wiki/F1_score) metric for multilabel recognition. Supported representations: `MultiLabelRecognitionAnnotation`, `MultiLabelRecognitionPrediction`.
-  * `label_map` - the field in annotation metadata, which contains dataset label map.
+  * `label_map` - the field in annotation metadata, which contains dataset label map (Optional, should be provided if different from default).
   * `calculate_average` - allows calculation of average f-score (default value: `True`).
 * `focused_text_hmean` - Harmonic mean of precision and recall for focused scene text detection task introduced in [Robust Reading Competition challenge 2](https://rrc.cvc.uab.es/?ch=2&com=introduction). Supported representations: `TextDetectionAnnotation`, `TextDetectionPrediction`.
   * `ignore_difficult` - allows to ignore difficult ground truth text polygons in metric calculation.
@@ -148,14 +151,23 @@ More detailed information about calculation segmentation metrics you can find [h
 * `coco_recall` - MS COCO Average Recall metric for keypoints recognition and object detection tasks. Supported representations: `PoseEstimationAnnotation`, `PoseEstimationPrediction`, `DetectionAnnotation`, `DetectionPrediction`.
   * `max_detections` - max number of predicted results per image. If you have more predictions,the results with minimal confidence will be ignored.
   * `threshold` - intersection over union threshold. You can specify one value or comma separated range of values. This parameter supports precomputed values for standard COCO thresholds (`.5`, `.75`, `.5:.05:.95`).
+* `coco_keypoints_precision` - MS COCO Average Precision metric for keypoints recognition task. Supported representations: `PoseEstimationAnnotation`, `PoseEstimationPrediction`.
+  * `max_detections` - max number of predicted results per image. If you have more predictions, the results with minimal confidence will be ignored.
+  * `threshold` - intersection over union threshold. You can specify one value or comma separated range of values. This parameter supports precomputed values for standard COCO thresholds (`.5`, `.75`, `.5:.05:.95`).
+* `coco_keypoints_recall` - MS COCO Average Recall metric for keypoints recognition task. Supported representations: `PoseEstimationAnnotation`, `PoseEstimationPrediction`.
+  * `max_detections` - max number of predicted results per image. If you have more predictions, the results with minimal confidence will be ignored.
+  * `threshold` - intersection over union threshold. You can specify one value or comma separated range of values. This parameter supports precomputed values for standard COCO thresholds (`.5`, `.75`, `.5:.05:.95`).
 * `hit_ratio` - metric for recommendation system evaluation. Supported representations: `HitRatioAnnotation`, `HitRatioPrediction`.
   * `top_k` - definition of number elements in rank list (optional, default 10).
 * `ndcg` - [Normalized Discounted Cumulative Gain](https://en.wikipedia.org/wiki/Discounted_cumulative_gain). Supported representations: `HitRatioAnnotation`, `HitRatioPrediction`.
   * `top_k` - definition of number elements in rank list (optional, default 10).
 * `dice` - [Sørensen–Dice coefficient](https://en.wikipedia.org/wiki/S%C3%B8rensen%E2%80%93Dice_coefficient). Supported representations: `BrainTumorSegmentationAnnotation, BrainTumorSegmentationPrediction`.
-* `dice_index` - [Sørensen–Dice coefficient](https://en.wikipedia.org/wiki/S%C3%B8rensen%E2%80%93Dice_coefficient). Supported representations: `BrainTumorSegmentationAnnotation, BrainTumorSegmentationPrediction`. Supports result representation for multiple classes. Metric represents result for each class if `label_map` for used dataset is provided, otherwise it represents overall result. For `brats_numpy` converter file with labels set in `labels_file` tag.
-  * `mean` - allows calculation mean value (default - `True`)
-  * `median` - allows calculation median value (default - `False`)
+* `dice_index` - [Sørensen–Dice coefficient](https://en.wikipedia.org/wiki/S%C3%B8rensen%E2%80%93Dice_coefficient). Supported representations: `BrainTumorSegmentationAnnotation`, `BrainTumorSegmentationPrediction`, `SegmentationAnnotation`, `SegmentationPrediction`. Supports result representation for multiple classes. Metric represents result for each class if `label_map` for used dataset is provided, otherwise it represents overall result. For the `brats_numpy` converter, the file with labels is set in the `labels_file` tag.
+  * `mean` - allows calculation mean value (default - `True`).
+  * `median` - allows calculation median value (default - `False`).
 * `bleu` - [Bilingual Evaluation Understudy](https://en.wikipedia.org/wiki/BLEU). Supperted representations: `MachineTranslationAnnotation`, `MachineTranslationPrediction`.
   * `smooth` - Whether or not to apply Lin et al. 2004 smoothing.
   *  `max_order` - Maximum n-gram order to use when computing BLEU score. (Optional, default 4).
+* `f1` - F1-score for question answering task. Supported representations: `QuestionAnsweringAnnotation`, `QuestionAnsweringPrediction`.
+* `exact_match` - Exact matching (EM) metric for question answering task. Supported representations: `QuestionAnsweringAnnotation`, `QuestionAnsweringPrediction`.
+* `mpjpe_multiperson` - [Mean Per Joint Position Error](http://vision.imar.ro/human3.6m/pami-h36m.pdf) extended for multi-person case. Supported representations: `PoseEstimation3dAnnotation`, `PoseEstimation3dPrediction`. As the first step, correspondence between ground truth and prediction skeletons is established for each image. Then MPJPE is computed for each ground truth and prediction pair. The error is averaged over poses in each frame, then over all frames.
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/__init__.py b/tools/accuracy_checker/accuracy_checker/metrics/__init__.py
index 24cd1ca6773..f25a7e013c9 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/__init__.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/__init__.py
@@ -14,9 +14,16 @@
 limitations under the License.
 """
 
-from .metric_executor import MetricsExecutor, Metric
-
-from .classification import ClassificationAccuracy, ClassificationAccuracyClasses, ClipAccuracy
+from .metric_executor import MetricsExecutor
+from .metric import Metric, PerImageMetricResult
+
+from .classification import (
+    ClassificationAccuracy,
+    ClassificationAccuracyClasses,
+    ClipAccuracy,
+    ClassificationF1Score,
+    MetthewsCorrelation
+)
 from .detection import (DetectionMAP, MissRate, Recall, DetectionAccuracyMetric)
 from .reid import CMCScore, ReidMAP, PairwiseAccuracy, PairwiseAccuracySubsets
 from .semantic_segmentation import SegmentationAccuracy, SegmentationIOU, SegmentationMeanAccuracy, SegmentationFWAcc
@@ -47,25 +54,31 @@
     IncidentalSceneTextLocalizationRecall,
     IncidentalSceneTextLocalizationHMean
 )
-from .coco_metrics import MSCOCOAveragePrecision, MSCOCORecall
+from .coco_metrics import MSCOCOAveragePrecision, MSCOCORecall, MSCOCOKeypointsPrecision, MSCOCOKeypointsRecall
 from .coco_orig_metrics import (
     MSCOCOorigAveragePrecision,
     MSCOCOorigRecall,
 
     MSCOCOOrigSegmAveragePrecision,
-    MSCOCOorigSegmRecall
+    MSCOCOorigSegmRecall,
+
+    MSCOCOOrigKeyPointsAveragePrecision,
 )
 from .hit_ratio import HitRatioMetric, NDSGMetric
 from .machine_translation import BilingualEvaluationUnderstudy
+from .question_answering import ExactMatchScore, ScoreF1
+from .mpjpe_multiperson import MpjpeMultiperson
 
 
 __all__ = [
     'Metric',
     'MetricsExecutor',
+    'PerImageMetricResult',
 
     'ClassificationAccuracy',
     'ClassificationAccuracyClasses',
     'ClipAccuracy',
+    'ClassificationF1Score',
 
     'DetectionMAP',
     'MissRate',
@@ -109,13 +122,21 @@
 
     'MSCOCOAveragePrecision',
     'MSCOCORecall',
+    'MSCOCOKeypointsPrecision',
+    'MSCOCOKeypointsRecall',
     'MSCOCOorigAveragePrecision',
     'MSCOCOorigRecall',
     'MSCOCOOrigSegmAveragePrecision',
     'MSCOCOorigSegmRecall',
+    'MSCOCOOrigKeyPointsAveragePrecision',
 
     'HitRatioMetric',
     'NDSGMetric',
 
-    'BilingualEvaluationUnderstudy'
+    'BilingualEvaluationUnderstudy',
+
+    'ScoreF1',
+    'ExactMatchScore',
+
+    'MpjpeMultiperson'
 ]
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/average_meter.py b/tools/accuracy_checker/accuracy_checker/metrics/average_meter.py
index eaae62ab4c4..bd15cc7e6da 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/average_meter.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/average_meter.py
@@ -37,6 +37,12 @@ def update(self, annotation_val, prediction_val):
             self.accumulator += loss
             self.total_count += increment
 
+        if np.isscalar(loss):
+            loss = float(loss)
+        else:
+            loss = loss.astype(float)
+        return np.divide(loss, increment, out=np.zeros_like(loss), where=increment != 0)
+
     def evaluate(self):
         if self.total_count is None:
             return 0.0
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/character_recognition.py b/tools/accuracy_checker/accuracy_checker/metrics/character_recognition.py
index e4ffa16e4db..61cf7e28612 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/character_recognition.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/character_recognition.py
@@ -29,7 +29,8 @@ def configure(self):
         self.accuracy = AverageMeter(lambda annotation, prediction: int(annotation == prediction))
 
     def update(self, annotation, prediction):
-        self.accuracy.update(annotation.label, prediction.label)
+        return self.accuracy.update(annotation.label, prediction.label)
+
 
     def evaluate(self, annotations, predictions):
         return self.accuracy.evaluate()
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/classification.py b/tools/accuracy_checker/accuracy_checker/metrics/classification.py
index e5d504f7a7f..115b0cf612e 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/classification.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/classification.py
@@ -16,8 +16,8 @@
 
 import numpy as np
 
-from ..representation import ClassificationAnnotation, ClassificationPrediction
-from ..config import NumberField, StringField
+from ..representation import ClassificationAnnotation, ClassificationPrediction, TextClassificationAnnotation
+from ..config import NumberField, StringField, ConfigError
 from .metric import PerImageEvaluationMetric
 from .average_meter import AverageMeter
 
@@ -29,7 +29,7 @@ class ClassificationAccuracy(PerImageEvaluationMetric):
 
     __provider__ = 'accuracy'
 
-    annotation_types = (ClassificationAnnotation, )
+    annotation_types = (ClassificationAnnotation, TextClassificationAnnotation)
     prediction_types = (ClassificationPrediction, )
 
     @classmethod
@@ -54,7 +54,7 @@ def loss(annotation_label, prediction_top_k_labels):
         self.accuracy = AverageMeter(loss)
 
     def update(self, annotation, prediction):
-        self.accuracy.update(annotation.label, prediction.top_k(self.top_k))
+        return self.accuracy.update(annotation.label, prediction.top_k(self.top_k))
 
     def evaluate(self, annotations, predictions):
         return self.accuracy.evaluate()
@@ -70,7 +70,7 @@ class ClassificationAccuracyClasses(PerImageEvaluationMetric):
 
     __provider__ = 'accuracy_per_class'
 
-    annotation_types = (ClassificationAnnotation, )
+    annotation_types = (ClassificationAnnotation, TextClassificationAnnotation)
     prediction_types = (ClassificationPrediction, )
 
     @classmethod
@@ -89,8 +89,14 @@ def parameters(cls):
     def configure(self):
         self.top_k = self.get_value_from_config('top_k')
         label_map = self.get_value_from_config('label_map')
-        self.labels = self.dataset.metadata.get(label_map)
-        self.meta['names'] = list(self.labels.values())
+        if self.dataset.metadata:
+            self.labels = self.dataset.metadata.get(label_map)
+            if not self.labels:
+                raise ConfigError('accuracy per class metric requires label_map providing in dataset_meta'
+                                  'Please provide dataset meta file or regenerate annotation')
+        else:
+            raise ConfigError('accuracy per class metric requires dataset metadata'
+                              'Please provide dataset meta file or regenerate annotation')
 
         def loss(annotation_label, prediction_top_k_labels):
             result = np.zeros_like(list(self.labels.keys()))
@@ -107,9 +113,10 @@ def counter(annotation_label):
         self.accuracy = AverageMeter(loss, counter)
 
     def update(self, annotation, prediction):
-        self.accuracy.update(annotation.label, prediction.top_k(self.top_k))
+        return self.accuracy.update(annotation.label, prediction.top_k(self.top_k))
 
     def evaluate(self, annotations, predictions):
+        self.meta['names'] = list(self.labels.values())
         return self.accuracy.evaluate()
 
     def reset(self):
@@ -145,13 +152,15 @@ def update(self, annotation, prediction):
             self.video_accuracy.update(video_top_label, self.previous_video_label)
             self.video_avg_prob = AverageProbMeter()
 
-        self.video_avg_prob.update(annotation.label, prediction.scores)
+        video_avg = self.video_avg_prob.update(annotation.label, prediction.scores)
 
-        self.clip_accuracy.update(annotation.label, prediction.label)
+        clip_accuracy = self.clip_accuracy.update(annotation.label, prediction.label)
 
         self.previous_video_id = video_id
         self.previous_video_label = annotation.label
 
+        return [clip_accuracy, video_avg]
+
     def evaluate(self, annotations, predictions):
         self.meta['names'] = ['clip_accuracy', 'video_accuracy']
         return [self.clip_accuracy.evaluate(), self.video_accuracy.evaluate()]
@@ -160,3 +169,90 @@ def reset(self):
         self.clip_accuracy.reset()
         self.video_accuracy.reset()
         self.video_avg_prob.reset()
+
+
+class ClassificationF1Score(PerImageEvaluationMetric):
+    """F1-score for classification, derived from a confusion matrix accumulated in update()."""
+    __provider__ = 'classification_f1-score'
+    annotation_types = (ClassificationAnnotation, TextClassificationAnnotation)
+    prediction_types = (ClassificationPrediction, )
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'label_map': StringField(optional=True, default='label_map', description="Label map.")
+        })
+        return parameters
+
+    def configure(self):
+        label_map = self.get_value_from_config('label_map')
+        if not self.dataset.metadata:
+            raise ConfigError('classification_f1-score metric requires dataset metadata. '
+                              'Please provide dataset meta file or regenerate annotation')
+        self.labels = self.dataset.metadata.get(label_map)
+        if not self.labels:
+            raise ConfigError('classification_f1-score metric requires label_map providing in dataset_meta. '
+                              'Please provide dataset meta file or regenerate annotation')
+        self.cm = np.zeros((len(self.labels), len(self.labels)))  # rows: ground truth, columns: prediction
+
+    def update(self, annotation, prediction):
+        self.cm[annotation.label, prediction.label] += 1  # count one (ground truth, prediction) pair
+        return annotation.label == prediction.label
+
+    def evaluate(self, annotations, predictions):
+        cm_diagonal = self.cm.diagonal()  # correctly classified samples per class
+        cm_horizontal_sum = self.cm.sum(axis=1)  # ground-truth samples per class
+        cm_vertical_sum = self.cm.sum(axis=0)  # predicted samples per class
+        precision = np.divide(
+            cm_diagonal, cm_vertical_sum, out=np.zeros_like(cm_diagonal, dtype=float), where=cm_vertical_sum != 0
+        )
+        recall = np.divide(
+            cm_diagonal, cm_horizontal_sum, out=np.zeros_like(cm_diagonal, dtype=float), where=cm_horizontal_sum != 0
+        )
+        sum_precision_recall = precision + recall
+        f1_score = 2 * np.divide(
+            precision * recall, sum_precision_recall, out=np.zeros_like(cm_diagonal, dtype=float),
+            where=sum_precision_recall != 0
+        )
+        return f1_score if len(f1_score) == 2 else f1_score[0]
+
+    def reset(self):
+        self.cm = np.zeros((len(self.labels), len(self.labels)))
+
+
+class MetthewsCorrelation(PerImageEvaluationMetric):
+    """Matthews correlation coefficient for binary classification, built from TP/TN/FP/FN counters."""
+    __provider__ = 'metthews_correlation_coef'
+    annotation_types = (ClassificationAnnotation, TextClassificationAnnotation)
+    prediction_types = (ClassificationPrediction, )
+
+    def configure(self):
+        label_map = (self.dataset.metadata or {}).get('label_map', [])  # metadata may be missing
+        if label_map and len(label_map) != 2:
+            raise ConfigError('metthews_correlation_coefficient applicable only for binary classification task')
+        self.reset()
+
+    def update(self, annotation, prediction):
+        if annotation.label and prediction.label:
+            self.tp += 1
+            return 1
+        if not annotation.label and not prediction.label:
+            self.tn += 1
+            return 1
+        if not annotation.label and prediction.label:
+            self.fp += 1
+            return 0
+        # only remaining combination: truthy annotation label, falsy prediction label
+        self.fn += 1
+        return 0
+
+    def evaluate(self, annotations, predictions):
+        denominator = (self.tp + self.fp) * (self.tp + self.fn) * (self.tn + self.fp) * (self.tn + self.fn)
+        return ((self.tp * self.tn) - (self.fp * self.fn)) / np.sqrt(denominator) if denominator != 0 else -1
+
+    def reset(self):
+        self.tp = 0
+        self.tn = 0
+        self.fp = 0
+        self.fn = 0
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/coco_metrics.py b/tools/accuracy_checker/accuracy_checker/metrics/coco_metrics.py
index a33225bd8b4..9e39fe4ee1d 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/coco_metrics.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/coco_metrics.py
@@ -16,14 +16,14 @@
 
 from functools import singledispatch
 import numpy as np
-from ..config import NumberField, BaseField
+from ..config import NumberField, BaseField, ConfigError
 from ..representation import (
     DetectionPrediction,
     DetectionAnnotation,
     PoseEstimationPrediction,
     PoseEstimationAnnotation
 )
-from ..utils import get_or_parse_value
+from ..utils import get_or_parse_value, finalize_metric_result
 from .overlap import Overlap
 from .metric import PerImageEvaluationMetric
 
@@ -60,48 +60,60 @@ def parameters(cls):
     def configure(self):
         self.max_detections = self.get_value_from_config('max_detections')
         self.thresholds = get_or_parse_value(self.get_value_from_config('threshold'), COCO_THRESHOLDS)
-        label_map = self.dataset.metadata.get('label_map', [])
+        if not self.dataset.metadata:  # label_map and background_label are read from metadata below
+            raise ConfigError('coco metrics require dataset metadata providing in dataset_meta. '
+                              'Please provide dataset meta file or regenerate annotation')
+        label_map = self.dataset.metadata.get('label_map', {})
         self.labels = [
             label for label in label_map
             if label != self.dataset.metadata.get('background_label')
         ]
+        if not self.labels:  # nothing left to evaluate once the background label is excluded
+            raise ConfigError('coco metrics require label_map providing in dataset_meta. '
+                              'Please provide dataset meta file or regenerate annotation')
         self.meta['names'] = [label_map[label] for label in self.labels]
         self.matching_results = [[] for _ in self.labels]
 
     def update(self, annotation, prediction):
         compute_iou, create_boxes = select_specific_parameters(annotation)
+        per_class_results = []
 
         for label_id, label in enumerate(self.labels):
             detections, scores, dt_difficult = prepare_predictions(prediction, label, self.max_detections)
             ground_truth, gt_difficult, iscrowd, boxes, areas = prepare_annotations(annotation, label, create_boxes)
             iou = compute_iou(ground_truth, detections, boxes, areas)
-            self.matching_results[label_id].append(
-                evaluate_image(
-                    ground_truth,
-                    gt_difficult,
-                    iscrowd,
-                    detections,
-                    dt_difficult,
-                    scores,
-                    iou,
-                    self.thresholds
-                    ))
+            eval_result = evaluate_image(
+                ground_truth, gt_difficult, iscrowd, detections, dt_difficult, scores, iou, self.thresholds
+            )
+            self.matching_results[label_id].append(eval_result)
+            per_class_results.append(eval_result)
+
+        return per_class_results
 
     def evaluate(self, annotations, predictions):
         pass
 
     def reset(self):
         self.matching_results = [[] for _ in self.labels]
+        label_map = self.dataset.metadata.get('label_map', {})
+        self.meta['names'] = [label_map[label] for label in self.labels]
 
 
 class MSCOCOAveragePrecision(MSCOCOBaseMetric):
     __provider__ = 'coco_precision'
 
+    def update(self, annotation, prediction):
+        per_class_matching = super().update(annotation, prediction)
+        return [
+            compute_precision_recall(self.thresholds, [per_class_matching[i]])[0] for i, _ in enumerate(self.labels)
+        ]
+
     def evaluate(self, annotations, predictions):
         precision = [
             compute_precision_recall(self.thresholds, self.matching_results[i])[0]
             for i, _ in enumerate(self.labels)
         ]
+        precision, self.meta['names'] = finalize_metric_result(precision, self.meta['names'])
 
         return precision
 
@@ -109,11 +121,118 @@ def evaluate(self, annotations, predictions):
 class MSCOCORecall(MSCOCOBaseMetric):
     __provider__ = 'coco_recall'
 
+    def update(self, annotation, prediction):
+        per_class_matching = super().update(annotation, prediction)
+        return [
+            compute_precision_recall(self.thresholds, [per_class_matching[i]])[1] for i, _ in enumerate(self.labels)
+        ]
+
+    def evaluate(self, annotations, predictions):
+        recalls = [
+            compute_precision_recall(self.thresholds, self.matching_results[i])[1]
+            for i, _ in enumerate(self.labels)
+        ]
+        recalls, self.meta['names'] = finalize_metric_result(recalls, self.meta['names'])
+
+        return recalls
+
+
+class MSCOCOKeypointsBaseMetric(MSCOCOBaseMetric):
+    annotation_types = (PoseEstimationAnnotation, )
+    prediction_types = (PoseEstimationPrediction, )
+
+    def update(self, annotation, prediction):
+        per_class_results = []
+        def _prepare_predictions(prediction, label, max_detections):
+            if prediction.size == 0:
+                return [], [], []
+            prediction_ids = prediction.labels == label
+            scores = prediction.scores[prediction_ids]
+            if np.size(scores) == 0:
+                return [], [], []
+            scores_ids = np.argsort(- scores, kind='mergesort')  # descending by score, stable for ties
+            difficult_box_mask = np.full(prediction.size, False)
+            difficult_box_mask[prediction.metadata.get('difficult_boxes', [])] = True
+            difficult_for_label = difficult_box_mask[prediction_ids]
+            if len(scores_ids) > max_detections:  # keep only the top-scored max_detections entries
+                scores_ids = scores_ids[:max_detections]
+            detections = prepare_keypoints(prediction, prediction_ids)
+            detections = detections[scores_ids]
+
+            return detections, scores[scores_ids], difficult_for_label[scores_ids]
+
+        def _prepare_annotations(annotation, label):
+            annotation_ids = annotation.labels == label
+            difficult_box_mask = np.full(annotation.size, False)
+            difficult_box_indices = annotation.metadata.get("difficult_boxes", [])
+            iscrowd = np.array(annotation.metadata.get('iscrowd', [0] * annotation.size))
+            difficult_box_mask[difficult_box_indices] = True
+            difficult_box_mask[iscrowd > 0] = True  # crowd annotations are marked difficult as well
+            difficult_label = difficult_box_mask[annotation_ids]
+            not_difficult_box_indices = np.argwhere(~difficult_label).reshape(-1)
+            difficult_box_indices = np.argwhere(difficult_label).reshape(-1)
+            iscrowd_label = iscrowd[annotation_ids]
+            order = np.hstack((not_difficult_box_indices, difficult_box_indices)).astype(int)  # difficult entries last
+            boxes = np.array(annotation.bboxes)
+            boxes = boxes[annotation_ids]
+            areas = np.array(annotation.areas)
+            areas = areas[annotation_ids] if np.size(areas) > 0 else np.array([])
+            boxes = boxes[order]
+            areas = areas[order]
+
+            return (
+                prepare_keypoints(annotation, annotation_ids)[order],
+                difficult_label[order],
+                iscrowd_label[order], boxes, areas
+            )
+
+        for label_id, label in enumerate(self.labels):
+            detections, scores, dt_difficult = _prepare_predictions(prediction, label, self.max_detections)
+            ground_truth, gt_difficult, iscrowd, boxes, areas = _prepare_annotations(annotation, label)
+            iou = compute_oks(ground_truth, detections, boxes, areas)  # passed to evaluate_image as the overlap
+            eval_result = evaluate_image(
+                ground_truth, gt_difficult, iscrowd, detections, dt_difficult, scores, iou, self.thresholds
+            )
+            self.matching_results[label_id].append(eval_result)  # accumulated per label across update() calls
+            per_class_results.append(eval_result)
+
+        return per_class_results  # one evaluate_image result per label, for this image only
+
+
+class MSCOCOKeypointsPrecision(MSCOCOKeypointsBaseMetric):
+    __provider__ = 'coco_keypoints_precision'
+
+    def update(self, annotation, prediction):
+        per_class_matching = super().update(annotation, prediction)  # this image's matching, one per label
+        return [  # per-image values: element [0] of compute_precision_recall for each label
+            compute_precision_recall(self.thresholds, [per_class_matching[i]])[0] for i, _ in enumerate(self.labels)
+        ]
+
+    def evaluate(self, annotations, predictions):
+        precision = [  # dataset-level values from all matching results accumulated by update()
+            compute_precision_recall(self.thresholds, self.matching_results[i])[0]
+            for i, _ in enumerate(self.labels)
+        ]
+        precision, self.meta['names'] = finalize_metric_result(precision, self.meta['names'])
+
+        return precision
+
+
+class MSCOCOKeypointsRecall(MSCOCOKeypointsBaseMetric):
+    __provider__ = 'coco_keypoints_recall'  # must differ from MSCOCOKeypointsPrecision's provider name
+
+    def update(self, annotation, prediction):
+        per_class_matching = super().update(annotation, prediction)  # this image's matching, one per label
+        return [  # per-image values: element [1] of compute_precision_recall for each label
+            compute_precision_recall(self.thresholds, [per_class_matching[i]])[1] for i, _ in enumerate(self.labels)
+        ]
+
     def evaluate(self, annotations, predictions):
         recalls = [
             compute_precision_recall(self.thresholds, self.matching_results[i])[1]
             for i, _ in enumerate(self.labels)
         ]
+        recalls, self.meta['names'] = finalize_metric_result(recalls, self.meta['names'])
 
         return recalls
 
@@ -191,7 +310,7 @@ def prepare_annotations(annotation, label, create_boxes=False):
 
 def compute_precision_recall(thresholds, matching_results):
     num_thresholds = len(thresholds)
-    rectangle_thresholds = np.linspace(.0, 1.00, np.round((1.00 - .0) / .01) + 1, endpoint=True)
+    rectangle_thresholds = np.linspace(.0, 1.00, int(np.round((1.00 - .0) / .01)) + 1, endpoint=True)
     num_rec_thresholds = len(rectangle_thresholds)
     precision = -np.ones((num_thresholds, num_rec_thresholds))  # -1 for the precision of absent categories
     recall = -np.ones(num_thresholds)
@@ -205,6 +324,8 @@ def compute_precision_recall(thresholds, matching_results):
     fps = np.logical_and(np.logical_not(dtm), np.logical_not(dt_ignored))
     tp_sum = np.cumsum(tps, axis=1).astype(dtype=np.float)
     fp_sum = np.cumsum(fps, axis=1).astype(dtype=np.float)
+    if npig == 0:
+        return np.nan, np.nan
     for t, (tp, fp) in enumerate(zip(tp_sum, fp_sum)):
         tp = np.array(tp)
         fp = np.array(fp)
@@ -212,7 +333,6 @@ def compute_precision_recall(thresholds, matching_results):
         rc = tp / npig
         pr = tp / (fp + tp + np.spacing(1))
         q = np.zeros(num_rec_thresholds)
-
         if num_detections:
             recall[t] = rc[-1]
         else:
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/coco_orig_metrics.py b/tools/accuracy_checker/accuracy_checker/metrics/coco_orig_metrics.py
index f716476a8f9..bbbb52b4c4f 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/coco_orig_metrics.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/coco_orig_metrics.py
@@ -17,7 +17,14 @@
 import os
 import tempfile
 import json
-
+try:
+    from pycocotools.coco import COCO
+except ImportError:
+    COCO = None
+try:
+    from pycocotools.cocoeval import COCOeval as coco_eval
+except ImportError:
+    coco_eval = None
 from ..representation import (
     DetectionPrediction,
     DetectionAnnotation,
@@ -27,7 +34,7 @@
     PoseEstimationPrediction
 )
 from ..logging import print_info
-from ..config import BaseField
+from ..config import BaseField, ConfigError
 from ..utils import get_or_parse_value
 from .metric import FullDatasetEvaluationMetric
 from .coco_metrics import COCO_THRESHOLDS
@@ -37,6 +44,7 @@
 if SHOULD_DISPLAY_DEBUG_IMAGES:
     import cv2
 
+
 def box_to_coco(prediction_data_to_store, pred):
     x_mins = pred.x_mins.tolist()
     y_mins = pred.y_mins.tolist()
@@ -52,6 +60,7 @@ def box_to_coco(prediction_data_to_store, pred):
 
     return prediction_data_to_store
 
+
 def segm_to_coco(prediction_data_to_store, pred):
     encoded_masks = pred.mask
 
@@ -74,6 +83,7 @@ def keypoints_to_coco(prediction_data_to_store, pred):
 
     return prediction_data_to_store
 
+
 iou_specific_processing = {
     'bbox': box_to_coco,
     'segm': segm_to_coco,
@@ -109,19 +119,22 @@ def generate_map_pred_label_id_to_coco_cat_id(has_background, use_full_label_map
         return res_map
 
     def _prepare_coco_structures(self):
-        from pycocotools.coco import COCO
-
         annotation_conversion_parameters = self.dataset.config.get('annotation_conversion')
         if not annotation_conversion_parameters:
-            raise ValueError('annotation_conversion parameter is not pointed, '
-                             'but it is required for coco original metrics')
+            raise ConfigError('annotation_conversion parameter is not pointed, '
+                              'but it is required for coco original metrics')
         annotation_file = annotation_conversion_parameters.get('annotation_file')
         if not annotation_file.is_file():
-            raise ValueError("annotation file '{}' is not found".format(annotation_file))
+            raise ConfigError("annotation file '{}' is not found".format(annotation_file))
         has_background = annotation_conversion_parameters.get('has_background', False)
         use_full_label_map = annotation_conversion_parameters.get('use_full_label_map', False)
+        if not self.dataset.metadata:
+            raise ConfigError('coco orig metrics require dataset_meta'
+                              'Please provide dataset meta file or regenerate annotation')
         meta = self.dataset.metadata
 
+        if COCO is None:
+            raise ValueError('pycocotools is not installed, please install it')
         coco = COCO(str(annotation_file))
         assert 0 not in coco.cats.keys()
         coco_cat_name_to_id = {v['name']: k for k, v in coco.cats.items()}
@@ -133,6 +146,9 @@ def _prepare_coco_structures(self):
             coco_cat_name_to_id[bg_name] = bg_lbl
         else:
             assert 'background_label' not in meta
+        if not meta.get('label_map'):
+            raise ConfigError('coco_orig metrics require label_map providing in dataset_meta'
+                              'Please provide dataset meta file or regenerated annotation')
 
         if not use_full_label_map:
             map_pred_label_id_to_coco_cat_id = {k: coco_cat_name_to_id[v] for k, v in meta['label_map'].items()}
@@ -232,9 +248,9 @@ def _debug_printing_and_displaying_predictions(coco, coco_res, data_source, shou
 
     @staticmethod
     def _run_coco_evaluation(coco, coco_res, iou_type='bbox', threshold=None):
-        from pycocotools.cocoeval import COCOeval
-
-        cocoeval = COCOeval(coco, coco_res, iouType=iou_type)
+        if coco_eval is None:
+            raise ValueError('pycocotools is not installed, please install it before usage')
+        cocoeval = coco_eval(coco, coco_res, iouType=iou_type)
         if threshold is not None:
             cocoeval.params.iouThrs = threshold
         cocoeval.evaluate()
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/detection.py b/tools/accuracy_checker/accuracy_checker/metrics/detection.py
index 7265ccbc807..c1517c7d83b 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/detection.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/detection.py
@@ -23,12 +23,12 @@
 
 from ..utils import finalize_metric_result
 from .overlap import Overlap, IOA
-from ..config import BoolField, NumberField, StringField
+from ..config import BoolField, NumberField, StringField, ConfigError
 from ..representation import (
     DetectionAnnotation, DetectionPrediction,
     ActionDetectionPrediction, ActionDetectionAnnotation
 )
-from .metric import Metric, FullDatasetEvaluationMetric
+from .metric import Metric, FullDatasetEvaluationMetric, PerImageEvaluationMetric
 
 
 class APIntegralType(enum.Enum):
@@ -82,8 +82,14 @@ def configure(self):
         self.use_filtered_tp = self.get_value_from_config('use_filtered_tp')
 
         label_map = self.config.get('label_map', 'label_map')
+        if not self.dataset.metadata:
+            raise ConfigError('detection metrics require label_map providing in dataset_meta'
+                              'Please provide dataset meta file or regenerate annotation')
         labels = self.dataset.metadata.get(label_map, {})
-        self.labels = labels.keys()
+        if not labels:
+            raise ConfigError('detection metrics require label_map providing in dataset_meta'
+                              'Please provide dataset meta file or regenerate annotation')
+        self.labels = list(labels.keys())
         valid_labels = list(filter(lambda x: x != self.dataset.metadata.get('background_label'), self.labels))
         self.meta['names'] = [labels[name] for name in valid_labels]
 
@@ -127,8 +133,14 @@ def per_class_detection_statistics(self, annotations, predictions, labels):
     def evaluate(self, annotations, predictions):
         pass
 
+    def reset(self):  # rebuild self.meta['names'] from the label map, leaving out the background label
+        label_map = self.config.get('label_map', 'label_map')  # metadata key that holds the label map
+        dataset_labels = self.dataset.metadata.get(label_map, {})
+        valid_labels = list(filter(lambda x: x != self.dataset.metadata.get('background_label'), dataset_labels))
+        self.meta['names'] = [dataset_labels[name] for name in valid_labels]
+
 
-class DetectionMAP(BaseDetectionMetricMixin, FullDatasetEvaluationMetric):
+class DetectionMAP(BaseDetectionMetricMixin, FullDatasetEvaluationMetric, PerImageEvaluationMetric):
     """
     Class for evaluating mAP metric of detection models.
     """
@@ -156,7 +168,19 @@ def configure(self):
         super().configure()
         self.integral = APIntegralType(self.get_value_from_config('integral'))
 
+    def update(self, annotation, prediction):
+        return self._calculate_map([annotation], [prediction])
+
     def evaluate(self, annotations, predictions):
+        average_precisions = self._calculate_map(annotations, predictions)
+        average_precisions, self.meta['names'] = finalize_metric_result(average_precisions, self.meta['names'])
+        if not average_precisions:
+            warnings.warn("No detections to compute mAP")
+            average_precisions.append(0)
+
+        return average_precisions
+
+    def _calculate_map(self, annotations, predictions):
         valid_labels = get_valid_labels(self.labels, self.dataset.metadata.get('background_label'))
         labels_stat = self.per_class_detection_statistics(annotations, predictions, valid_labels)
 
@@ -170,15 +194,10 @@ def evaluate(self, annotations, predictions):
             else:
                 average_precisions.append(np.nan)
 
-        average_precisions, self.meta['names'] = finalize_metric_result(average_precisions, self.meta['names'])
-        if not average_precisions:
-            warnings.warn("No detections to compute mAP")
-            average_precisions.append(0)
-
         return average_precisions
 
 
-class MissRate(BaseDetectionMetricMixin, FullDatasetEvaluationMetric):
+class MissRate(BaseDetectionMetricMixin, FullDatasetEvaluationMetric, PerImageEvaluationMetric):
     """
     Class for evaluating Miss Rate metric of detection models.
     """
@@ -200,6 +219,21 @@ def configure(self):
         super().configure()
         self.fppi_level = self.get_value_from_config('fppi_level')
 
+    def update(self, annotation, prediction):
+        valid_labels = get_valid_labels(self.labels, self.dataset.metadata.get('background_label'))
+        labels_stat = self.per_class_detection_statistics([annotation], [prediction], valid_labels)
+        miss_rates = []  # one value per label, computed from this single annotation/prediction pair
+        for label in labels_stat:
+            label_miss_rate = 1.0 - labels_stat[label]['recall']
+            label_fppi = labels_stat[label]['fppi']
+
+            # insertion point of fppi_level; assumes label_fppi is sorted ascending - TODO confirm
+            position = bisect.bisect_left(label_fppi, self.fppi_level)
+            m0 = max(0, position - 1)  # index just below the insertion point, clamped at 0
+            m1 = position if position < len(label_miss_rate) else m0  # falls back to m0 past the end
+            miss_rates.append(0.5 * (label_miss_rate[m0] + label_miss_rate[m1]))  # mean of the two neighbours
+        return miss_rates
+
     def evaluate(self, annotations, predictions):
         valid_labels = get_valid_labels(self.labels, self.dataset.metadata.get('background_label'))
         labels_stat = self.per_class_detection_statistics(annotations, predictions, valid_labels)
@@ -217,7 +251,7 @@ def evaluate(self, annotations, predictions):
         return miss_rates
 
 
-class Recall(BaseDetectionMetricMixin, FullDatasetEvaluationMetric):
+class Recall(BaseDetectionMetricMixin, FullDatasetEvaluationMetric, PerImageEvaluationMetric):
     """
     Class for evaluating recall metric of detection models.
     """
@@ -227,7 +261,19 @@ class Recall(BaseDetectionMetricMixin, FullDatasetEvaluationMetric):
     annotation_types = (DetectionAnnotation, ActionDetectionAnnotation)
     prediction_types = (DetectionPrediction, ActionDetectionPrediction)
 
+    def update(self, annotation, prediction):
+        return self._calculate_recall([annotation], [prediction])
+
     def evaluate(self, annotations, predictions):
+        recalls = self._calculate_recall(annotations, predictions)
+        recalls, self.meta['names'] = finalize_metric_result(recalls, self.meta['names'])
+        if not recalls:
+            warnings.warn("No detections to compute recall")
+            recalls.append(0)
+
+        return recalls
+
+    def _calculate_recall(self, annotations, predictions):
         valid_labels = get_valid_labels(self.labels, self.dataset.metadata.get('background_label'))
         labels_stat = self.per_class_detection_statistics(annotations, predictions, valid_labels)
 
@@ -240,15 +286,10 @@ def evaluate(self, annotations, predictions):
             else:
                 recalls.append(np.nan)
 
-        recalls, self.meta['names'] = finalize_metric_result(recalls, self.meta['names'])
-        if not recalls:
-            warnings.warn("No detections to compute mAP")
-            recalls.append(0)
-
         return recalls
 
 
-class DetectionAccuracyMetric(BaseDetectionMetricMixin, FullDatasetEvaluationMetric):
+class DetectionAccuracyMetric(BaseDetectionMetricMixin, PerImageEvaluationMetric):
     __provider__ = 'detection_accuracy'
 
     annotation_types = (DetectionAnnotation, ActionDetectionAnnotation)
@@ -277,29 +318,32 @@ def configure(self):
         self.ignore_label = self.get_value_from_config('ignore_label')
         fast_match = self.get_value_from_config('fast_match')
         self.match_func = match_detections_class_agnostic if not fast_match else fast_match_detections_class_agnostic
+        self.cm = np.zeros([len(self.labels), len(self.labels)], dtype=np.int32)
+
+    def update(self, annotation, prediction):
+        matches = self.match_func(prediction, annotation, self.overlap_threshold, self.overlap_method)
+        update_cm = confusion_matrix(matches, prediction, annotation, len(self.labels), self.ignore_label)
+        self.cm += update_cm
+        if self.use_normalization:
+            return np.mean(normalize_confusion_matrix(update_cm).diagonal())
+        return float(np.sum(update_cm.diagonal())) / float(np.maximum(1, np.sum(update_cm)))
 
     def evaluate(self, annotations, predictions):
-        all_matches = self.match_func(
-            predictions, annotations, self.overlap_threshold, self.overlap_method
-        )
-        cm = confusion_matrix(all_matches, predictions, annotations, len(self.labels), self.ignore_label)
         if self.use_normalization:
-            return np.mean(normalize_confusion_matrix(cm).diagonal())
+            return np.mean(normalize_confusion_matrix(self.cm).diagonal())
 
-        return float(np.sum(cm.diagonal())) / float(np.maximum(1, np.sum(cm)))
+        return float(np.sum(self.cm.diagonal())) / float(np.maximum(1, np.sum(self.cm)))
 
 
-def confusion_matrix(all_matched_ids, predicted_data, gt_data, num_classes, ignore_label=None):
+def confusion_matrix(matched_ids, prediction, gt, num_classes, ignore_label=None):
     out_cm = np.zeros([num_classes, num_classes], dtype=np.int32)
-    for gt, prediction in zip(gt_data, predicted_data):
-        for match_pair in all_matched_ids[gt.identifier]:
-            gt_label = int(gt.labels[match_pair[0]])
-
-            if ignore_label and gt_label == ignore_label:
-                continue
+    for match_pair in matched_ids:
+        gt_label = int(gt.labels[match_pair[0]])
+        if ignore_label and gt_label == ignore_label:
+            continue
 
-            pred_label = int(prediction.labels[match_pair[1]])
-            out_cm[gt_label, pred_label] += 1
+        pred_label = int(prediction.labels[match_pair[1]])
+        out_cm[gt_label, pred_label] += 1
 
     return out_cm
 
@@ -309,91 +353,72 @@ def normalize_confusion_matrix(cm):
     return cm.astype(np.float32) / row_sums
 
 
-def match_detections_class_agnostic(predicted_data, gt_data, min_iou, overlap_method):
-    all_matches = {}
-    total_gt_bbox_num = 0
-    matched_gt_bbox_num = 0
-
-    for gt, prediction in zip(gt_data, predicted_data):
-        gt_bboxes = np.stack((gt.x_mins, gt.y_mins, gt.x_maxs, gt.y_maxs), axis=-1)
-        predicted_bboxes = np.stack(
-            (prediction.x_mins, prediction.y_mins, prediction.x_maxs, prediction.y_maxs), axis=-1
-        )
-        predicted_scores = prediction.scores
-
-        gt_bboxes_num = len(gt_bboxes)
-        predicted_bboxes_num = len(predicted_bboxes)
-
-        sorted_ind = np.argsort(-predicted_scores)
-        predicted_bboxes = predicted_bboxes[sorted_ind]
-        predicted_original_ids = np.arange(predicted_bboxes_num)[sorted_ind]
-
-        similarity_matrix = calculate_similarity_matrix(predicted_bboxes, gt_bboxes, overlap_method)
-
-        matches = []
-        visited_gt = np.zeros(gt_bboxes_num, dtype=np.bool)
-        for predicted_id in range(predicted_bboxes_num):
-            best_overlap = 0.0
-            best_gt_id = -1
-            for gt_id in range(gt_bboxes_num):
-                if visited_gt[gt_id]:
-                    continue
+def match_detections_class_agnostic(prediction, gt, min_iou, overlap_method):
+    gt_bboxes = np.stack((gt.x_mins, gt.y_mins, gt.x_maxs, gt.y_maxs), axis=-1)
+    predicted_bboxes = np.stack(
+        (prediction.x_mins, prediction.y_mins, prediction.x_maxs, prediction.y_maxs), axis=-1
+    )
+    predicted_scores = prediction.scores
 
-                overlap_value = similarity_matrix[predicted_id, gt_id]
-                if overlap_value > best_overlap:
-                    best_overlap = overlap_value
-                    best_gt_id = gt_id
+    gt_bboxes_num = len(gt_bboxes)
+    predicted_bboxes_num = len(predicted_bboxes)
 
-            if best_gt_id >= 0 and best_overlap > min_iou:
-                visited_gt[best_gt_id] = True
+    sorted_ind = np.argsort(-predicted_scores)
+    predicted_bboxes = predicted_bboxes[sorted_ind]
+    predicted_original_ids = np.arange(predicted_bboxes_num)[sorted_ind]
 
-                matches.append((best_gt_id, predicted_original_ids[predicted_id]))
-                if len(matches) >= gt_bboxes_num:
-                    break
+    similarity_matrix = calculate_similarity_matrix(predicted_bboxes, gt_bboxes, overlap_method)
 
-        all_matches[gt.identifier] = matches
+    matches = []
+    visited_gt = np.zeros(gt_bboxes_num, dtype=np.bool)
+    for predicted_id in range(predicted_bboxes_num):
+        best_overlap = 0.0
+        best_gt_id = -1
+        for gt_id in range(gt_bboxes_num):
+            if visited_gt[gt_id]:
+                continue
 
-        total_gt_bbox_num += gt_bboxes_num
-        matched_gt_bbox_num += len(matches)
+            overlap_value = similarity_matrix[predicted_id, gt_id]
+            if overlap_value > best_overlap:
+                best_overlap = overlap_value
+                best_gt_id = gt_id
 
-    return all_matches
+        if best_gt_id >= 0 and best_overlap > min_iou:
+            visited_gt[best_gt_id] = True
 
+            matches.append((best_gt_id, predicted_original_ids[predicted_id]))
+            if len(matches) >= gt_bboxes_num:
+                break
 
-def fast_match_detections_class_agnostic(predicted_data, gt_data, min_iou, overlap_method):
-    all_matches = {}
-    total_gt_bbox_num = 0
-    matched_gt_bbox_num = 0
+    return matches
 
-    for gt, prediction in zip(gt_data, predicted_data):
-        gt_bboxes = np.stack((gt.x_mins, gt.y_mins, gt.x_maxs, gt.y_maxs), axis=-1)
-        matches = []
-        total_gt_bbox_num += len(gt_bboxes)
-        if prediction.size:
-            predicted_bboxes = np.stack(
-                (prediction.x_mins, prediction.y_mins, prediction.x_maxs, prediction.y_maxs), axis=-1
-            )
 
-            similarity_matrix = calculate_similarity_matrix(gt_bboxes, predicted_bboxes, overlap_method)
+def fast_match_detections_class_agnostic(prediction, gt, min_iou, overlap_method):
+    matches = []
+    gt_bboxes = np.stack((gt.x_mins, gt.y_mins, gt.x_maxs, gt.y_maxs), axis=-1)
+    if prediction.size:
+        predicted_bboxes = np.stack(
+            (prediction.x_mins, prediction.y_mins, prediction.x_maxs, prediction.y_maxs), axis=-1
+        )
 
-            for _ in gt_bboxes:
-                best_match_pos = np.unravel_index(similarity_matrix.argmax(), similarity_matrix.shape)
-                best_match_value = similarity_matrix[best_match_pos]
+        similarity_matrix = calculate_similarity_matrix(gt_bboxes, predicted_bboxes, overlap_method)
 
-                if best_match_value <= min_iou:
-                    break
+        for _ in gt_bboxes:
+            best_match_pos = np.unravel_index(similarity_matrix.argmax(), similarity_matrix.shape)
+            best_match_value = similarity_matrix[best_match_pos]
 
-                gt_id = best_match_pos[0]
-                predicted_id = best_match_pos[1]
+            if best_match_value <= min_iou:
+                break
 
-                similarity_matrix[gt_id, :] = 0.0
-                similarity_matrix[:, predicted_id] = 0.0
+            gt_id = best_match_pos[0]
+            predicted_id = best_match_pos[1]
 
-                matches.append((gt_id, predicted_id))
-                matched_gt_bbox_num += 1
+            similarity_matrix[gt_id, :] = 0.0
+            similarity_matrix[:, predicted_id] = 0.0
 
-        all_matches[gt.identifier] = matches
+            matches.append((gt_id, predicted_id))
 
-    return all_matches
+    return matches
 
 
 def calculate_similarity_matrix(set_a, set_b, overlap):
@@ -540,7 +565,8 @@ def _prepare_annotation_boxes(annotation, ignore_difficult, label):
 
         difficult_boxes[ground_truth.identifier] = difficult_box_mask
         if ignore_difficult:
-            num_ground_truth -= np.sum(difficult_box_mask)
+            if np.size(difficult_box_mask) > 0:
+                num_ground_truth -= np.sum(difficult_box_mask)
 
     return used_boxes, num_ground_truth, difficult_boxes
 
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/hit_ratio.py b/tools/accuracy_checker/accuracy_checker/metrics/hit_ratio.py
index de27dccf9c9..8404ce3bfef 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/hit_ratio.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/hit_ratio.py
@@ -20,10 +20,11 @@
 import numpy as np
 
 from ..representation import HitRatioAnnotation, HitRatioPrediction
-from .metric import FullDatasetEvaluationMetric
+from .metric import PerImageEvaluationMetric
 from ..config import NumberField
 
-class BaseRecommenderMetric(FullDatasetEvaluationMetric):
+
+class BaseRecommenderMetric(PerImageEvaluationMetric):
     annotation_types = (HitRatioAnnotation, )
     prediction_types = (HitRatioPrediction, )
 
@@ -108,3 +109,28 @@ class NDSGMetric(BaseRecommenderMetric):
 
     def __init__(self, *args, **kwargs):
         super().__init__(ndcg_discounter, *args, **kwargs)
+
+
+class LogLoss(PerImageEvaluationMetric):
+    __provider__ = 'log_loss'
+
+    annotation_types = (HitRatioAnnotation, )
+    prediction_types = (HitRatioPrediction, )
+
+    def configure(self):
+        self.losses = []
+        self.meta.update({
+            'scale': 1, 'postfix': ' ', 'calculate_mean': False, 'target': 'higher-worse'
+        })
+
+    def update(self, annotation, prediction):
+        score = np.clip(prediction.scores, 1e-15, 1 - 1e-15)
+        loss = -np.log(score) if annotation.positive else -np.log(1. - score)
+        self.losses.append(loss)
+        return loss
+
+    def evaluate(self, annotations, predictions):
+        return np.mean(self.losses)
+
+    def reset(self):
+        self.losses = []
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/metric.py b/tools/accuracy_checker/accuracy_checker/metrics/metric.py
index 72bd4dd0308..4895b1aa62c 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/metric.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/metric.py
@@ -15,6 +15,7 @@
 """
 
 import copy
+from collections import namedtuple
 from ..representation import ContainerRepresentation
 from ..config import ConfigError
 from ..utils import is_single_metric_source, get_supported_representations
@@ -23,6 +24,8 @@
 from ..dependency import ClassProvider
 from ..utils import zipped_transform, get_parameter_value_from_config, contains_any
 
+PerImageMetricResult = namedtuple('PerImageMetricResult', ['metric_name', 'metric_type', 'result', 'direction'])
+
 
 class Metric(ClassProvider):
     """
@@ -42,7 +45,7 @@ def __init__(self, config, dataset, name=None, state=None):
         self.dataset = dataset
         self.state = state
         self._update_iter = 0
-        self.meta = {}
+        self.meta = {'target': 'higher-better'}
         self._initial_state = copy.deepcopy(state)
 
         self.validate_config()
@@ -92,7 +95,8 @@ def get_value_from_config(self, key):
         return get_parameter_value_from_config(self.config, self.parameters(), key)
 
     def submit(self, annotation, prediction):
-        self.update(annotation, prediction)
+        direction = self.meta.get('target', 'higher-better')
+        return PerImageMetricResult(self.name, self.config['type'], self.update(annotation, prediction), direction)
 
     def submit_all(self, annotations, predictions):
         return self.evaluate(annotations, predictions)
@@ -182,7 +186,10 @@ def reset(self):
 class PerImageEvaluationMetric(Metric):
     def submit(self, annotation, prediction):
         annotation_, prediction_ = self._resolve_representation_containers(annotation, prediction)
-        self.update(annotation_, prediction_)
+        metric_result = self.update(annotation_, prediction_)
+        direction = self.meta.get('target', 'higher-better')
+
+        return PerImageMetricResult(self.name, self.config['type'], metric_result, direction)
 
     def evaluate(self, annotations, predictions):
         raise NotImplementedError
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/metric_executor.py b/tools/accuracy_checker/accuracy_checker/metrics/metric_executor.py
index f3d5426f46d..45464ce996b 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/metric_executor.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/metric_executor.py
@@ -14,12 +14,11 @@
 limitations under the License.
 """
 
-from collections import namedtuple
+from collections import namedtuple, OrderedDict
 
 from ..presenters import BasePresenter, EvaluationResult
 from ..config import StringField
-from ..utils import zipped_transform
-from .metric import Metric
+from .metric import Metric, FullDatasetEvaluationMetric
 from ..config import ConfigValidator, ConfigError
 
 MetricInstance = namedtuple(
@@ -42,34 +41,9 @@ def __init__(self, metrics_config, dataset=None, state=None):
         self._dataset = dataset
 
         self.metrics = []
-        type_ = 'type'
-        identifier = 'name'
-        reference = 'reference'
-        threshold = 'threshold'
-        presenter = 'presenter'
+        self.need_store_predictions = False
         for metric_config_entry in metrics_config:
-            metric_config = ConfigValidator(
-                "metrics", on_extra_argument=ConfigValidator.IGNORE_ON_EXTRA_ARGUMENT,
-                fields=self.parameters()
-            )
-            metric_type = metric_config_entry.get(type_)
-            metric_config.validate(metric_config_entry, type_)
-
-            metric_identifier = metric_config_entry.get(identifier, metric_type)
-
-            metric_fn = Metric.provide(
-                metric_type, metric_config_entry, self.dataset, metric_identifier, state=self.state
-            )
-            metric_presenter = BasePresenter.provide(metric_config_entry.get(presenter, 'print_scalar'))
-
-            self.metrics.append(MetricInstance(
-                metric_identifier,
-                metric_type,
-                metric_fn,
-                metric_config_entry.get(reference),
-                metric_config_entry.get(threshold),
-                metric_presenter
-            ))
+            self.register_metric(metric_config_entry)
 
     @classmethod
     def parameters(cls):
@@ -90,7 +64,9 @@ def _set_dataset(self, dataset):
             metric.metric_fn.dataset = dataset
 
     def __call__(self, context, *args, **kwargs):
-        self.update_metrics_on_batch(context.annotation_batch, context.prediction_batch)
+        self.update_metrics_on_batch(
+            context.input_ids_batch, context.annotation_batch, context.prediction_batch
+        )
         context.annotations.extend(context.annotation_batch)
         context.predictions.extend(context.prediction_batch)
 
@@ -99,10 +75,14 @@ def update_metrics_on_object(self, annotation, prediction):
         Updates metric value corresponding given annotation and prediction objects.
         """
 
+        metric_results = []
+
         for metric in self.metrics:
-            metric.metric_fn.submit(annotation, prediction)
+            metric_results.append(metric.metric_fn.submit(annotation, prediction))
+
+        return metric_results
 
-    def update_metrics_on_batch(self, annotation, prediction):
+    def update_metrics_on_batch(self, batch_ids, annotation, prediction):
         """
         Updates metric value corresponding given batch.
 
@@ -111,7 +91,12 @@ def update_metrics_on_batch(self, annotation, prediction):
             prediction: list of batch number of prediction objects.
         """
 
-        zipped_transform(self.update_metrics_on_object, annotation, prediction)
+        results = OrderedDict()
+
+        for input_id, single_annotation, single_prediction in zip(batch_ids, annotation, prediction):
+            results[input_id] = self.update_metrics_on_object(single_annotation, single_prediction)
+
+        return results
 
     def iterate_metrics(self, annotations, predictions):
         for name, metric_type, functor, reference, threshold, presenter in self.metrics:
@@ -124,9 +109,51 @@ def iterate_metrics(self, annotations, predictions):
                 meta=functor.meta,
             )
 
+    def register_metric(self, metric_config_entry):
+        type_ = 'type'
+        identifier = 'name'
+        reference = 'reference'
+        threshold = 'threshold'
+        presenter = 'presenter'
+        metric_config_validator = ConfigValidator(
+            "metrics", on_extra_argument=ConfigValidator.IGNORE_ON_EXTRA_ARGUMENT,
+            fields=self.parameters()
+        )
+        metric_type = metric_config_entry.get(type_)
+        metric_config_validator.validate(metric_config_entry, type_)
+
+        metric_identifier = metric_config_entry.get(identifier, metric_type)
+
+        metric_fn = Metric.provide(
+            metric_type, metric_config_entry, self.dataset, metric_identifier, state=self.state
+        )
+        metric_presenter = BasePresenter.provide(metric_config_entry.get(presenter, 'print_scalar'))
+
+        self.metrics.append(MetricInstance(
+            metric_identifier,
+            metric_type,
+            metric_fn,
+            metric_config_entry.get(reference),
+            metric_config_entry.get(threshold),
+            metric_presenter
+        ))
+        if isinstance(metric_fn, FullDatasetEvaluationMetric):
+            self.need_store_predictions = True
+
     def get_metric_presenters(self):
         return [metric.presenter for metric in self.metrics]
 
+    def get_metrics_direction(self):
+        return {metric.name: metric.metric_fn.meta.get('target', 'higher-better') for metric in self.metrics}
+
+    def get_metrics_attributes(self):
+        return {
+            metric.name: {
+                'direction':  metric.metric_fn.meta.get('target', 'higher-better'),
+                'type': metric.metric_type
+            } for metric in self.metrics
+        }
+
     def reset(self):
         for metric in self.metrics:
             metric.metric_fn.reset()
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/mpjpe_multiperson.py b/tools/accuracy_checker/accuracy_checker/metrics/mpjpe_multiperson.py
new file mode 100644
index 00000000000..a5b9ef07e17
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/metrics/mpjpe_multiperson.py
@@ -0,0 +1,112 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import warnings
+import numpy as np
+from ..representation import PoseEstimation3dPrediction, PoseEstimation3dAnnotation
+from .metric import PerImageEvaluationMetric
+
+
+class MpjpeMultiperson(PerImageEvaluationMetric):
+    __provider__ = 'mpjpe_multiperson'
+    annotation_types = (PoseEstimation3dAnnotation,)
+    prediction_types = (PoseEstimation3dPrediction,)
+
+    def __init__(self, config, dataset, name=None, state=None):
+        super().__init__(config, dataset, name, state)
+        self.per_image_mpjpe = []
+        self.meta.update({
+            'scale': 10,
+            'postfix': 'mm',
+            'target': 'higher-worse',
+        })
+
+    def update(self, annotation, prediction):
+        # since the pelvis is not detected, remove it before evaluation
+        kpt_mask = np.ones_like(annotation.x_3d_values[0], dtype=bool)
+        kpt_mask[2] = False
+        annotation.x_3d_values = annotation.x_3d_values[:, kpt_mask]
+        annotation.y_3d_values = annotation.y_3d_values[:, kpt_mask]
+        annotation.z_3d_values = annotation.z_3d_values[:, kpt_mask]
+        if prediction.size:
+            prediction.x_3d_values = prediction.x_3d_values[:, kpt_mask]
+            prediction.y_3d_values = prediction.y_3d_values[:, kpt_mask]
+            prediction.z_3d_values = prediction.z_3d_values[:, kpt_mask]
+
+        matching_results = []
+        sorted_prediction_ids = np.argsort(-prediction.scores, kind='stable')
+        mask = np.ones(annotation.size, dtype=bool)
+        for prediction_id in range(prediction.size):
+            max_iou = 0
+            matched_id = -1
+            bbox = prediction.bboxes[sorted_prediction_ids[prediction_id]]
+            for annotation_id in range(annotation.size):
+                if not mask[annotation_id]:
+                    continue
+                iou = _get_iou(bbox, annotation.bboxes[annotation_id])
+                if iou > max_iou:
+                    max_iou = iou
+                    matched_id = annotation_id
+            if matched_id >= 0:
+                mask[matched_id] = 0
+                gt_coordinates = np.transpose(np.array(
+                    [annotation.x_3d_values[matched_id], annotation.y_3d_values[matched_id],
+                     annotation.z_3d_values[matched_id]]), (1, 0))
+                predicted_coordinates = np.transpose(np.array(
+                    [prediction.x_3d_values[sorted_prediction_ids[prediction_id]],
+                     prediction.y_3d_values[sorted_prediction_ids[prediction_id]],
+                     prediction.z_3d_values[sorted_prediction_ids[prediction_id]]]), (1, 0))
+                matching_results.append((gt_coordinates, predicted_coordinates))
+
+        image_mpjpe = 0
+        for gt, target in matching_results:
+            image_mpjpe += _mpjpe(gt, target)
+        if matching_results:
+            image_mpjpe /= len(matching_results)
+        self.per_image_mpjpe.append(image_mpjpe)
+        return image_mpjpe
+
+    def evaluate(self, annotations, predictions):
+        total_mpjpe = 0
+        for image_mpjpe in self.per_image_mpjpe:
+            total_mpjpe += image_mpjpe
+        if self.per_image_mpjpe:
+            total_mpjpe /= len(self.per_image_mpjpe)
+        else:
+            warnings.warn('No predicted results to compute MPJPE')
+        return total_mpjpe
+
+    def reset(self):
+        self.per_image_mpjpe = []
+
+
+def _get_iou(box_a, box_b):
+    tl_x = max(box_a[0], box_b[0])
+    tl_y = max(box_a[1], box_b[1])
+    br_x = min(box_a[2], box_b[2])
+    br_y = min(box_a[3], box_b[3])
+    intersection_area = max(0, br_x - tl_x) * max(0, br_y - tl_y)
+
+    area_a = (box_a[2] - box_a[0]) * (box_a[3] - box_a[1])
+    area_b = (box_b[2] - box_b[0]) * (box_b[3] - box_b[1])
+    iou = intersection_area / np.float32(area_a + area_b - intersection_area)
+
+    return iou
+
+
+def _mpjpe(gt, target):
+    jpe = np.linalg.norm(gt - target)
+    return jpe / target.shape[0]
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/multilabel_recognition.py b/tools/accuracy_checker/accuracy_checker/metrics/multilabel_recognition.py
index 16a75990a12..4b8cb937094 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/multilabel_recognition.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/multilabel_recognition.py
@@ -17,7 +17,7 @@
 import numpy as np
 from .metric import PerImageEvaluationMetric
 from ..representation import MultiLabelRecognitionAnnotation, MultiLabelRecognitionPrediction
-from ..config import StringField, BoolField, ConfigValidator
+from ..config import StringField, BoolField, ConfigValidator, ConfigError
 
 
 class MultiLabelMetric(PerImageEvaluationMetric):
@@ -40,21 +40,20 @@ def parameters(cls):
         return parameters
 
     def configure(self):
+        if not self.dataset.metadata:
+            raise ConfigError('multi label metrics require dataset_meta. '
+                              'Please provide dataset meta file or regenerate annotation')
         self.labels = self.dataset.metadata.get(self.get_value_from_config('label_map'))
+        if not self.labels:
+            raise ConfigError('multi label metrics require label_map to be provided in dataset_meta. '
+                              'Please provide dataset meta file or regenerate annotation')
         self.calculate_average = self.get_value_from_config('calculate_average')
-
-        self.meta['scale'] = 1
-        self.meta['postfix'] = ''
-        self.meta['calculate_mean'] = False
-        self.meta['names'] = list(self.labels.values())
-        if self.calculate_average:
-            self.meta['names'].append('average')
         self.tp = np.zeros_like(list(self.labels.keys()), dtype=np.float)
         self.fp = np.zeros_like(list(self.labels.keys()), dtype=np.float)
         self.tn = np.zeros_like(list(self.labels.keys()), dtype=np.float)
         self.fn = np.zeros_like(list(self.labels.keys()), dtype=np.float)
-
         self.counter = np.zeros_like(list(self.labels.keys()), dtype=np.float)
+        self._create_meta()
 
     def update(self, annotation, prediction):
         def loss(annotation_labels, prediction_labels):
@@ -99,12 +98,21 @@ def counter(annotation_label):
     def evaluate(self, annotations, predictions):
         pass
 
+    def _create_meta(self):
+        self.meta['scale'] = 1
+        self.meta['postfix'] = ''
+        self.meta['calculate_mean'] = False
+        self.meta['names'] = list(self.labels.values())
+        if self.calculate_average:
+            self.meta['names'].append('average')
+
     def reset(self):
         self.tp = np.zeros_like(list(self.labels.keys()), dtype=np.float)
         self.fp = np.zeros_like(list(self.labels.keys()), dtype=np.float)
         self.tn = np.zeros_like(list(self.labels.keys()), dtype=np.float)
         self.fn = np.zeros_like(list(self.labels.keys()), dtype=np.float)
         self.counter = np.zeros_like(list(self.labels.keys()), dtype=np.float)
+        self._create_meta()
 
 
 class MultiLabelAccuracy(MultiLabelMetric):
@@ -177,17 +185,16 @@ def validate_config(self):
         ).validate(self.config)
 
     def configure(self):
+        if not self.dataset.metadata:
+            raise ConfigError('f1-score metric requires dataset metadata. '
+                              'Please provide dataset meta file or regenerate annotation')
         label_map = self.get_value_from_config('label_map')
         self.labels = self.dataset.metadata.get(label_map)
+        if not self.labels:
+            raise ConfigError('f1-score metric requires label_map to be provided in dataset_meta. '
+                              'Please provide dataset meta file or regenerate annotation')
         self.calculate_average = self.get_value_from_config('calculate_average')
-        self.meta['names'] = list(self.labels.values())
-        if self.calculate_average:
-            self.meta['names'].append('average')
-
-        self.meta['scale'] = 1
-        self.meta['postfix'] = ''
-        self.meta['calculate_mean'] = False
-        self.meta['names'] = list(self.labels.values()) + ['average']
+        self._create_meta()
 
     def update(self, annotation, prediction):
         self.precision.update(annotation, prediction)
@@ -214,3 +221,12 @@ def evaluate(self, annotations, predictions):
     def reset(self):
         self.precision.reset()
         self.recall.reset()
+        self._create_meta()
+
+    def _create_meta(self):
+        self.meta['names'] = list(self.labels.values())
+        if self.calculate_average:
+            self.meta['names'].append('average')
+        self.meta['scale'] = 1
+        self.meta['postfix'] = ''
+        self.meta['calculate_mean'] = False
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/question_answering.py b/tools/accuracy_checker/accuracy_checker/metrics/question_answering.py
new file mode 100644
index 00000000000..8f40fbc98ff
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/metrics/question_answering.py
@@ -0,0 +1,93 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import re
+from collections import Counter
+
+from ..representation import QuestionAnsweringAnnotation, QuestionAnsweringPrediction
+from .metric import PerImageEvaluationMetric
+
+
+def normalize_answer(s):
+    """Lower-case s, strip ASCII punctuation and a/an/the articles, collapse whitespace."""
+    punctuation = '!"#$%&\'()*+,-./:;<=>?@[\\]^_`{|}~'
+
+    # order matters: punctuation is dropped before the article regex runs on the text
+    lowered = s.lower()
+    no_punctuation = lowered.translate(str.maketrans('', '', punctuation))
+    no_articles = re.sub(r'\b(a|an|the)\b', ' ', no_punctuation)
+
+    # split()/join() trims both ends and squeezes every whitespace run to a single space
+    tokens = no_articles.split()
+    return ' '.join(tokens)
+
+
+class ScoreF1(PerImageEvaluationMetric):
+    """Token-overlap F1 for question answering, averaged over all updated samples."""
+    __provider__ = 'f1'
+
+    annotation_types = (QuestionAnsweringAnnotation,)
+    prediction_types = (QuestionAnsweringPrediction,)
+
+    def __init__(self, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+        self.f1 = 0
+        self.total = 0
+
+    def update(self, annotation, prediction):
+        """Accumulate and return the best F1 over every (ground truth, predicted answer) pair."""
+        max_f1_score = 0
+        for gt_answer in annotation.orig_answer_text:
+            annotation_tokens = normalize_answer(gt_answer['text']).split()  # invariant for the inner loop
+            for pred_answer in prediction.tokens:
+                prediction_tokens = normalize_answer(pred_answer).split()
+                same = sum((Counter(prediction_tokens) & Counter(annotation_tokens)).values())
+                if same == 0:
+                    continue  # nothing in common: contributes 0 and keeps empty token lists out of the divisions
+                precision, recall = same / len(prediction_tokens), same / len(annotation_tokens)
+                max_f1_score = max(max_f1_score, (2 * precision * recall) / (precision + recall))
+        self.f1 += max_f1_score
+        self.total += 1
+        return max_f1_score
+
+    def evaluate(self, annotation, prediction):
+        """Return the mean per-sample F1, or 0 when update() has not been called."""
+        return self.f1 / self.total if self.total else 0
+
+
+class ExactMatchScore(PerImageEvaluationMetric):
+    """Share of samples where some predicted answer equals some ground truth after normalization."""
+    __provider__ = 'exact_match'
+
+    annotation_types = (QuestionAnsweringAnnotation,)
+    prediction_types = (QuestionAnsweringPrediction,)
+
+    def __init__(self, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+        self.exact_match = 0
+        self.total = 0
+
+    def update(self, annotation, prediction):
+        """Accumulate and return 1 if any normalized prediction equals any normalized answer, else 0 (always int)."""
+        gt_answers = {normalize_answer(gt_answer['text']) for gt_answer in annotation.orig_answer_text}
+        max_exact_match = int(any(normalize_answer(answer) in gt_answers for answer in prediction.tokens))
+        self.exact_match += max_exact_match
+        self.total += 1
+        return max_exact_match
+
+    def evaluate(self, annotation, prediction):
+        """Return the exact-match rate, or 0 when update() has not been called."""
+        return self.exact_match / self.total if self.total else 0
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/regression.py b/tools/accuracy_checker/accuracy_checker/metrics/regression.py
index d6390e0f655..5dda31e5bd2 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/regression.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/regression.py
@@ -43,11 +43,16 @@ def __init__(self, value_differ, *args, **kwargs):
         self.value_differ = value_differ
 
     def configure(self):
-        self.meta.update({'names': ['mean', 'std'], 'scale': 1, 'postfix': ' ', 'calculate_mean': False})
+        self.meta.update({
+            'names': ['mean', 'std'], 'scale': 1, 'postfix': ' ', 'calculate_mean': False, 'target': 'higher-worse'
+        })
         self.magnitude = []
 
     def update(self, annotation, prediction):
-        self.magnitude.append(self.value_differ(annotation.value, prediction.value))
+        diff = self.value_differ(annotation.value, prediction.value)
+        self.magnitude.append(diff)
+
+        return diff
 
     def evaluate(self, annotations, predictions):
         return np.mean(self.magnitude), np.std(self.magnitude)
@@ -90,7 +95,7 @@ def __init__(self, value_differ, *args, **kwargs):
         self.value_differ = value_differ
 
     def configure(self):
-        self.meta.update({'scale': 1, 'postfix': ' ', 'calculate_mean': False})
+        self.meta.update({'scale': 1, 'postfix': ' ', 'calculate_mean': False, 'target': 'higher-worse'})
         self.ignore_out_of_range = self.get_value_from_config('ignore_values_not_in_interval')
 
         self.intervals = self.get_value_from_config('intervals')
@@ -108,22 +113,14 @@ def configure(self):
 
         self.intervals = np.unique(self.intervals)
         self.magnitude = [[] for _ in range(len(self.intervals) + 1)]
-
-        self.meta['names'] = ([])
-        if not self.ignore_out_of_range:
-            self.meta['names'] = (['mean: < ' + str(self.intervals[0]), 'std: < ' + str(self.intervals[0])])
-
-        for index in range(len(self.intervals) - 1):
-            self.meta['names'].append('mean: <= ' + str(self.intervals[index]) + ' < ' + str(self.intervals[index + 1]))
-            self.meta['names'].append('std: <= ' + str(self.intervals[index]) + ' < ' + str(self.intervals[index + 1]))
-
-        if not self.ignore_out_of_range:
-            self.meta['names'].append('mean: > ' + str(self.intervals[-1]))
-            self.meta['names'].append('std: > ' + str(self.intervals[-1]))
+        self._create_meta()
 
     def update(self, annotation, prediction):
         index = find_interval(annotation.value, self.intervals)
-        self.magnitude[index].append(self.value_differ(annotation.value, prediction.value))
+        diff = self.value_differ(annotation.value, prediction.value)
+        self.magnitude[index].append(diff)
+
+        return diff
 
     def evaluate(self, annotations, predictions):
         if self.ignore_out_of_range:
@@ -138,8 +135,22 @@ def evaluate(self, annotations, predictions):
 
         return result
 
+    def _create_meta(self):
+        """Rebuild meta['names'] with a mean/std label pair for every reported interval bucket."""
+        bounds = [str(value) for value in self.intervals]
+        names = []
+        if not self.ignore_out_of_range:
+            names += ['mean: < ' + bounds[0], 'std: < ' + bounds[0]]
+        for low, high in zip(bounds, bounds[1:]):
+            names += ['mean: <= ' + low + ' < ' + high, 'std: <= ' + low + ' < ' + high]
+        if not self.ignore_out_of_range:
+            # the open-ended buckets on both sides are only named when out-of-range values are kept
+            names += ['mean: > ' + bounds[-1], 'std: > ' + bounds[-1]]
+        self.meta['names'] = names
+
     def reset(self):
         self.magnitude = [[] for _ in range(len(self.intervals) + 1)]
+        self._create_meta()
 
 
 class MeanAbsoluteError(BaseRegressionMetric):
@@ -162,6 +173,10 @@ class RootMeanSquaredError(BaseRegressionMetric):
     def __init__(self, *args, **kwargs):
         super().__init__(mse_differ, *args, **kwargs)
 
+    def update(self, annotation, prediction):
+        # the parent records and returns the per-sample value from mse_differ; report its square root
+        return np.sqrt(super().update(annotation, prediction))
+
     def evaluate(self, annotations, predictions):
         return np.sqrt(np.mean(self.magnitude)), np.sqrt(np.std(self.magnitude))
 
@@ -186,6 +201,10 @@ class RootMeanSquaredErrorOnInterval(BaseRegressionOnIntervals):
     def __init__(self, *args, **kwargs):
         super().__init__(mse_differ, *args, **kwargs)
 
+    def update(self, annotation, prediction):
+        # the parent buckets and returns the per-sample value from mse_differ; report its square root
+        return np.sqrt(super().update(annotation, prediction))
+
     def evaluate(self, annotations, predictions):
         if self.ignore_out_of_range:
             self.magnitude = self.magnitude[1:-1]
@@ -211,7 +230,9 @@ class FacialLandmarksPerPointNormedError(PerImageEvaluationMetric):
     prediction_types = (FacialLandmarksPrediction, )
 
     def configure(self):
-        self.meta.update({'scale': 1, 'postfix': ' ', 'calculate_mean': True, 'data_format': '{:.4f}'})
+        self.meta.update({
+            'scale': 1, 'postfix': ' ', 'calculate_mean': True, 'data_format': '{:.4f}', 'target': 'higher-worse'
+        })
         self.magnitude = []
 
     def update(self, annotation, prediction):
@@ -221,6 +242,8 @@ def update(self, annotation, prediction):
         result /= np.maximum(annotation.interocular_distance, np.finfo(np.float64).eps)
         self.magnitude.append(result)
 
+        return result
+
     def evaluate(self, annotations, predictions):
         num_points = np.shape(self.magnitude)[1]
         point_result_name_pattern = 'point_{}_normed_error'
@@ -263,7 +286,7 @@ def configure(self):
             'postfix': ' ',
             'calculate_mean': not self.calculate_std or not self.percentile,
             'data_format': '{:.4f}',
-            'names': ['mean']
+            'target': 'higher-worse'
         })
         self.magnitude = []
 
@@ -275,7 +298,10 @@ def update(self, annotation, prediction):
         avg_result /= np.maximum(annotation.interocular_distance, np.finfo(np.float64).eps)
         self.magnitude.append(avg_result)
 
+        return avg_result
+
     def evaluate(self, annotations, predictions):
+        self.meta['names'] = ['mean']
         result = [np.mean(self.magnitude)]
 
         if self.calculate_std:
@@ -342,6 +368,7 @@ def parameters(cls):
 
     def __init__(self, *args, **kwargs):
         super().__init__(self._psnr_differ, *args, **kwargs)
+        self.meta['target'] = 'higher-better'
 
     def configure(self):
         super().configure()
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/reid.py b/tools/accuracy_checker/accuracy_checker/metrics/reid.py
index c006e2459a8..46bee22b012 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/reid.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/reid.py
@@ -14,10 +14,8 @@
 limitations under the License.
 """
 
+import warnings
 from collections import defaultdict, namedtuple
-from sklearn.metrics import auc, precision_recall_curve
-# noinspection PyProtectedMember
-from sklearn.metrics.base import _average_binary_score
 import numpy as np
 
 from ..representation import (
@@ -28,9 +26,34 @@
 from ..config import BaseField, BoolField, NumberField
 from .metric import FullDatasetEvaluationMetric
 
+try:
+    from sklearn.metrics import auc, precision_recall_curve
+except ImportError:
+    auc, precision_recall_curve = None, None
+
 PairDesc = namedtuple('PairDesc', 'image1 image2 same')
 
 
+def _average_binary_score(binary_metric, y_true, y_score):
+    """Apply binary_metric to binary targets, or macro-average it over multilabel indicator columns."""
+    y_true, y_score = np.asarray(y_true), np.asarray(y_score)
+    if y_true.ndim == 1 or (y_true.ndim == 2 and y_true.shape[1] == 1):
+        if len(np.unique(y_true)) > 2:
+            # a single column with more than two distinct values is multiclass, which has no binary reduction
+            raise ValueError('multiclass format is not supported')
+        return binary_metric(y_true, y_score)
+
+    if y_true.shape != y_score.shape:
+        raise ValueError('y_true and y_score must have the same shape for multilabel targets')
+    # one score per label column, then the plain mean (the replaced call used average="macro")
+    n_classes = y_score.shape[1]
+    score = np.zeros((n_classes,))
+    for c in range(n_classes):
+        score[c] = binary_metric(y_true.take([c], axis=1).ravel(), y_score.take([c], axis=1).ravel())
+
+    return np.average(score)
+
+
 class CMCScore(FullDatasetEvaluationMetric):
     """
     Cumulative Matching Characteristics (CMC) score.
@@ -83,6 +106,9 @@ def configure(self):
 
     def evaluate(self, annotations, predictions):
         dist_matrix = distance_matrix(annotations, predictions)
+        if np.size(dist_matrix) == 0:
+            warnings.warn('Gallery and query ids are not matched. CMC score can not be calculated.')
+            return 0
         gallery_cameras, gallery_pids, query_cameras, query_pids = get_gallery_query_pids(annotations)
 
         _cmc_score = eval_cmc(
@@ -124,6 +150,9 @@ def configure(self):
 
     def evaluate(self, annotations, predictions):
         dist_matrix = distance_matrix(annotations, predictions)
+        if np.size(dist_matrix) == 0:
+            warnings.warn('Gallery and query ids are not matched. ReID mAP can not be calculated.')
+            return 0
         gallery_cameras, gallery_pids, query_cameras, query_pids = get_gallery_query_pids(annotations)
 
         return eval_map(
@@ -155,6 +184,8 @@ def configure(self):
 
     def evaluate(self, annotations, predictions):
         embed_distances, pairs = get_embedding_distances(annotations, predictions)
+        if not pairs:
+            return np.nan
 
         min_score = self.min_score
         if min_score == 'train_median':
@@ -184,17 +215,20 @@ class PairwiseAccuracySubsets(FullDatasetEvaluationMetric):
 
     @classmethod
     def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
+        params = super().parameters()
+        params.update({
             'subset_number': NumberField(
                 optional=True, min_value=1, value_type=int, default=10, description="Number of subsets for separating."
             )
         })
-        return parameters
+        return params
 
     def configure(self):
         self.subset_num = self.get_value_from_config('subset_number')
-        self.accuracy_metric = PairwiseAccuracy(self.config, self.dataset)
+        config_copy = self.config.copy()
+        if 'subset_number' in config_copy:
+            config_copy.pop('subset_number')
+        self.accuracy_metric = PairwiseAccuracy(config_copy, self.dataset)
 
     def evaluate(self, annotations, predictions):
         subset_results = []
@@ -211,9 +245,10 @@ def evaluate(self, annotations, predictions):
             train_subset = self.mark_subset(train_subset)
 
             subset_result = self.accuracy_metric.evaluate(test_subset+train_subset, predictions)
-            subset_results.append(subset_result)
+            if not np.isnan(subset_result):
+                subset_results.append(subset_result)
 
-        return np.mean(subset_results)
+        return np.mean(subset_results) if subset_results else 0
 
     @staticmethod
     def make_subsets(subset_num, dataset_size):
@@ -248,7 +283,8 @@ def get_subset(container, subset_bounds):
 
 
 def extract_embeddings(annotation, prediction, query):
-    return np.stack([pred.embedding for pred, ann in zip(prediction, annotation) if ann.query == query])
+    embeddings = [pred.embedding for pred, ann in zip(prediction, annotation) if ann.query == query]
+    return np.stack(embeddings) if embeddings else embeddings
 
 
 def get_gallery_query_pids(annotation):
@@ -263,8 +299,9 @@ def get_gallery_query_pids(annotation):
 def distance_matrix(annotation, prediction):
     gallery_embeddings = extract_embeddings(annotation, prediction, query=False)
     query_embeddings = extract_embeddings(annotation, prediction, query=True)
+    not_empty = np.size(gallery_embeddings) > 0 and np.size(query_embeddings) > 0
 
-    return 1. - np.matmul(gallery_embeddings, np.transpose(query_embeddings)).T
+    return 1. - np.matmul(gallery_embeddings, np.transpose(query_embeddings)).T if not_empty else []
 
 
 def unique_sample(ids_dict, num):
@@ -378,20 +415,28 @@ def get_embedding_distances(annotation, prediction, train=False):
         if train != image1.metadata.get("train", False):
             continue
 
+        if image1.identifier not in image_indexes:
+            continue
+
         for image2 in image1.positive_pairs:
-            pairs.append(PairDesc(image_indexes[image1.identifier], image_indexes[image2], True))
+            if image2 in image_indexes:
+                pairs.append(PairDesc(image_indexes[image1.identifier], image_indexes[image2], True))
         for image2 in image1.negative_pairs:
-            pairs.append(PairDesc(image_indexes[image1.identifier], image_indexes[image2], False))
-
-    embed1 = np.asarray([prediction[idx].embedding for idx, _, _ in pairs])
-    embed2 = np.asarray([prediction[idx].embedding for _, idx, _ in pairs])
+            if image2 in image_indexes:
+                pairs.append(PairDesc(image_indexes[image1.identifier], image_indexes[image2], False))
 
-    return 0.5 * (1 - np.sum(embed1 * embed2, axis=1)), pairs
+    if pairs:
+        embed1 = np.asarray([prediction[idx].embedding for idx, _, _ in pairs])
+        embed2 = np.asarray([prediction[idx].embedding for _, idx, _ in pairs])
+        return 0.5 * (1 - np.sum(embed1 * embed2, axis=1)), pairs
+    return None, pairs
 
 
 def binary_average_precision(y_true, y_score, interpolated_auc=True):
-    def _average_precision(y_true_, y_score_, sample_weight=None):
-        precision, recall, _ = precision_recall_curve(y_true_, y_score_, sample_weight)
+    if auc is None:
+        raise ValueError('please install sklearn')
+    def _average_precision(y_true_, y_score_):
+        precision, recall, _ = precision_recall_curve(y_true_, y_score_)
         if not interpolated_auc:
             # Return the step function integral
             # The following works because the last entry of precision is
@@ -400,4 +445,4 @@ def _average_precision(y_true_, y_score_, sample_weight=None):
 
         return auc(recall, precision)
 
-    return _average_binary_score(_average_precision, y_true, y_score, average="macro")
+    return _average_binary_score(_average_precision, y_true, y_score)
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/semantic_segmentation.py b/tools/accuracy_checker/accuracy_checker/metrics/semantic_segmentation.py
index bab6877f18c..78440e1b462 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/semantic_segmentation.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/semantic_segmentation.py
@@ -16,7 +16,7 @@
 
 import numpy as np
 
-from ..config import BoolField
+from ..config import BoolField, ConfigError
 from ..representation import (
     SegmentationAnnotation,
     SegmentationPrediction,
@@ -49,27 +49,39 @@ def evaluate(self, annotations, predictions):
 
     def configure(self):
         self.use_argmax = self.get_value_from_config('use_argmax')
+        if not self.dataset.labels:  # update() sizes the confusion matrix from these labels
+            raise ConfigError('semantic segmentation metrics require label_map providing in dataset_meta. '
+                              'Please provide dataset meta file or regenerated annotation')
 
     def update(self, annotation, prediction):
         n_classes = len(self.dataset.labels)
         prediction_mask = np.argmax(prediction.mask, axis=0) if self.use_argmax else prediction.mask.astype('int64')
 
-        def update_confusion_matrix(confusion_matrix):
+        def confusion_matrix():
             label_true = annotation.mask.flatten()
             label_pred = prediction_mask.flatten()
             mask = (label_true >= 0) & (label_true < n_classes) & (label_pred < n_classes) & (label_pred >= 0)
             hist = np.bincount(n_classes * label_true[mask].astype(int) + label_pred[mask], minlength=n_classes ** 2)
             hist = hist.reshape(n_classes, n_classes)
-            confusion_matrix += hist
 
-            return confusion_matrix
+            return hist
 
-        self._update_state(update_confusion_matrix, self.CONFUSION_MATRIX_KEY, lambda: np.zeros((n_classes, n_classes)))
+        def accumulate(confusion_matrixs):
+            return confusion_matrixs + cm
+
+        cm = confusion_matrix()
+
+        self._update_state(accumulate, self.CONFUSION_MATRIX_KEY, lambda: np.zeros((n_classes, n_classes)))
+        return cm
 
 
 class SegmentationAccuracy(SegmentationMetric):
     __provider__ = 'segmentation_accuracy'
 
+    def update(self, annotation, prediction):
+        cm = super().update(annotation, prediction)
+        return np.diag(cm).sum() / cm.sum()
+
     def evaluate(self, annotations, predictions):
         confusion_matrix = self.state[self.CONFUSION_MATRIX_KEY]
         return np.diag(confusion_matrix).sum() / confusion_matrix.sum()
@@ -78,11 +90,19 @@ def evaluate(self, annotations, predictions):
 class SegmentationIOU(SegmentationMetric):
     __provider__ = 'mean_iou'
 
+    def update(self, annotation, prediction):
+        cm = super().update(annotation, prediction)
+        diagonal = np.diag(cm).astype(float)
+        union = cm.sum(axis=1) + cm.sum(axis=0) - diagonal
+        iou = np.divide(diagonal, union, out=np.full_like(diagonal, np.nan), where=union != 0)
+
+        return iou
+
     def evaluate(self, annotations, predictions):
         confusion_matrix = self.state[self.CONFUSION_MATRIX_KEY]
-        union = confusion_matrix.sum(axis=1) + confusion_matrix.sum(axis=0) - np.diag(confusion_matrix)
         diagonal = np.diag(confusion_matrix)
-        iou = np.divide(diagonal, union, out=np.zeros_like(diagonal), where=union != 0)
+        union = confusion_matrix.sum(axis=1) + confusion_matrix.sum(axis=0) - diagonal
+        iou = np.divide(diagonal, union, out=np.full_like(diagonal, np.nan), where=union != 0)
 
         values, names = finalize_metric_result(iou, list(self.dataset.labels.values()))
         self.meta['names'] = names
@@ -93,11 +113,19 @@ def evaluate(self, annotations, predictions):
 class SegmentationMeanAccuracy(SegmentationMetric):
     __provider__ = 'mean_accuracy'
 
+    def update(self, annotation, prediction):
+        cm = super().update(annotation, prediction)
+        diagonal = np.diag(cm).astype(float)
+        per_class_count = cm.sum(axis=1)
+        acc_cls = np.divide(diagonal, per_class_count, out=np.full_like(diagonal, np.nan), where=per_class_count != 0)
+
+        return acc_cls
+
     def evaluate(self, annotations, predictions):
         confusion_matrix = self.state[self.CONFUSION_MATRIX_KEY]
         diagonal = np.diag(confusion_matrix)
         per_class_count = confusion_matrix.sum(axis=1)
-        acc_cls = np.divide(diagonal, per_class_count, out=np.zeros_like(diagonal), where=per_class_count != 0)
+        acc_cls = np.divide(diagonal, per_class_count, out=np.full_like(diagonal, np.nan), where=per_class_count != 0)
 
         values, names = finalize_metric_result(acc_cls, list(self.dataset.labels.values()))
         self.meta['names'] = names
@@ -108,11 +136,19 @@ def evaluate(self, annotations, predictions):
 class SegmentationFWAcc(SegmentationMetric):
     __provider__ = 'frequency_weighted_accuracy'
 
+    def update(self, annotation, prediction):
+        cm = super().update(annotation, prediction)
+        diagonal = np.diag(cm).astype(float)
+        union = cm.sum(axis=1) + cm.sum(axis=0) - diagonal
+        iou = np.divide(diagonal, union, out=np.zeros_like(diagonal), where=union != 0)
+        freq = cm.sum(axis=1) / cm.sum()
+
+        return (freq[freq > 0] * iou[freq > 0]).sum()
+
     def evaluate(self, annotations, predictions):
         confusion_matrix = self.state[self.CONFUSION_MATRIX_KEY]
-
-        union = (confusion_matrix.sum(axis=1) + confusion_matrix.sum(axis=0) - np.diag(confusion_matrix))
         diagonal = np.diag(confusion_matrix)
+        union = confusion_matrix.sum(axis=1) + confusion_matrix.sum(axis=0) - diagonal
         iou = np.divide(diagonal, union, out=np.zeros_like(diagonal), where=union != 0)
         freq = confusion_matrix.sum(axis=1) / confusion_matrix.sum()
 
@@ -126,14 +162,15 @@ class SegmentationDSCAcc(PerImageEvaluationMetric):
     overall_metric = []
 
     def update(self, annotation, prediction):
-        cnt = 0
+        result = []
         for prediction_mask, annotation_mask in zip(prediction.mask, annotation.mask):
             annotation_mask = np.transpose(annotation_mask, (2, 0, 1))
             annotation_mask = np.expand_dims(annotation_mask, 0)
             numerator = np.sum(prediction_mask * annotation_mask) * 2.0 + 1.0
             denominator = np.sum(annotation_mask) + np.sum(prediction_mask) + 1.0
-            self.overall_metric.append(numerator / denominator)
-            cnt += 1
+            result.append(numerator / denominator)
+        self.overall_metric.extend(result)
+        return np.mean(result)
 
     def evaluate(self, annotations, predictions):
         return sum(self.overall_metric) / len(self.overall_metric)
@@ -144,8 +181,8 @@ def reset(self):
 
 class SegmentationDIAcc(PerImageEvaluationMetric):
     __provider__ = 'dice_index'
-    annotation_types = (BrainTumorSegmentationAnnotation,)
-    prediction_types = (BrainTumorSegmentationPrediction,)
+    annotation_types = (BrainTumorSegmentationAnnotation, SegmentationAnnotation)
+    prediction_types = (BrainTumorSegmentationPrediction, SegmentationPrediction)
 
     overall_metric = []
 
@@ -154,7 +191,7 @@ def parameters(cls):
         parameters = super().parameters()
         parameters.update({
             'mean': BoolField(optional=True, default=True, description='Allows calculation mean value.'),
-            'median': BoolField(optional=True, default=False, description='Allows calculation median value.')
+            'median': BoolField(optional=True, default=False, description='Allows calculation median value.'),
         })
 
         return parameters
@@ -162,8 +199,9 @@ def parameters(cls):
     def configure(self):
         self.mean = self.get_value_from_config('mean')
         self.median = self.get_value_from_config('median')
+        self.output_order = self.get_value_from_config('output_order')
 
-        labels = self.dataset.labels if self.dataset.metadata else ['overall']
+        labels = list(self.dataset.labels.values()) if self.dataset.metadata else ['overall']
         self.classes = len(labels)
 
         names_mean = ['mean@{}'.format(name) for name in labels] if self.mean else []
@@ -178,11 +216,16 @@ def update(self, annotation, prediction):
         result = np.zeros(shape=self.classes)
 
         annotation_data = annotation.mask
-        prediction_data = np.argmax(prediction.mask, axis=0)
+        prediction_data = prediction.mask
+
+        if prediction_data.shape[0] != 1 and len(prediction_data.shape) != 3:
+            raise RuntimeError("For '{}' metric prediction mask should has only 1 channel, but more found. "
+                               "Specify 'make_argmax' option in adapter or postprocessor."
+                               .format(self.__provider__))
 
-        for c in range(1, self.classes):
+        for c, p in enumerate(prediction.label_order, 1):
             annotation_data_ = (annotation_data == c)
-            prediction_data_ = (prediction_data == c)
+            prediction_data_ = (prediction_data == p)
 
             intersection_count = np.logical_and(annotation_data_, prediction_data_).sum()
             union_count = annotation_data_.sum() + prediction_data_.sum()
@@ -199,6 +242,8 @@ def update(self, annotation, prediction):
 
         self.overall_metric.append(result)
 
+        return result
+
     def evaluate(self, annotations, predictions):
         mean = np.mean(self.overall_metric, axis=0) if self.mean else []
         median = np.median(self.overall_metric, axis=0) if self.median else []
@@ -206,4 +251,10 @@ def evaluate(self, annotations, predictions):
         return result
 
     def reset(self):
+        labels = self.dataset.labels.values() if self.dataset.metadata else ['overall']
+        self.classes = len(labels)
+        names_mean = ['mean@{}'.format(name) for name in labels] if self.mean else []
+        names_median = ['median@{}'.format(name) for name in labels] if self.median else []
+        self.meta['names'] = names_mean + names_median
+        self.meta['calculate_mean'] = False
         self.overall_metric = []
diff --git a/tools/accuracy_checker/accuracy_checker/metrics/text_detection.py b/tools/accuracy_checker/accuracy_checker/metrics/text_detection.py
index f0d7a204ea0..fa6dfbb9c7a 100644
--- a/tools/accuracy_checker/accuracy_checker/metrics/text_detection.py
+++ b/tools/accuracy_checker/accuracy_checker/metrics/text_detection.py
@@ -142,6 +142,7 @@ def configure(self):
         self.one_to_one_match_score = self.get_value_from_config('one_to_one_match_score')
         self.one_to_many_match_score = self.get_value_from_config('one_to_many_match_score')
         self.many_to_one_match_score = self.get_value_from_config('many_to_one_match_score')
+        self.word_spotting = self.get_value_from_config('word_spotting')
         self.num_valid_gt = 0
         self.num_valid_detections = 0
         self.precision_sum = 0
@@ -176,7 +177,7 @@ def update(self, annotation, prediction):
             precision = 0 if num_det > 0 else 1
             self.precision_sum += precision
             self.recall_sum += recall
-            return
+            return precision, recall, num_valid_gt, num_valid_pred
 
         recall_accum = 0
         precision_accum = 0
@@ -218,6 +219,8 @@ def update(self, annotation, prediction):
         self.recall_sum += recall
         self.precision_sum += precision
 
+        return precision, recall, num_valid_gt, num_valid_pred
+
     def evaluate(self, annotations, predictions):
         raise NotImplementedError()
 
@@ -362,6 +365,10 @@ def reset(self):
 class FocusedTextLocalizationPrecision(FocusedTextLocalizationMetric):
     __provider__ = 'focused_text_precision'
 
+    def update(self, annotation, prediction):
+        matched, _recall, _gt_count, detections = super().update(annotation, prediction)  # parent's 4-tuple
+        return 0 if detections == 0 else matched / detections
+
     def evaluate(self, annotations, predictions):
         return self.precision_sum / self.num_valid_detections if self.num_valid_detections != 0 else 0
 
@@ -369,6 +376,10 @@ def evaluate(self, annotations, predictions):
 class FocusedTextLocalizationRecall(FocusedTextLocalizationMetric):
     __provider__ = 'focused_text_recall'
 
+    def update(self, annotation, prediction):
+        _, recall, num_valid_gt, _ = super().update(annotation, prediction)  # (precision, recall, n_gt, n_pred)
+        return recall / num_valid_gt if num_valid_gt != 0 else 0
+
     def evaluate(self, annotations, predictions):
         return self.recall_sum / self.num_valid_gt if self.num_valid_gt != 0 else 0
 
@@ -376,6 +387,13 @@ def evaluate(self, annotations, predictions):
 class FocusedTextLocalizationHMean(FocusedTextLocalizationMetric):
     __provider__ = 'focused_text_hmean'
 
+    def update(self, annotation, prediction):
+        """Return this sample's harmonic mean of its normalized precision and recall terms (0 if undefined)."""
+        p_sum, r_sum, gt_count, det_count = super().update(annotation, prediction)
+        p_ratio = 0 if det_count == 0 else p_sum / det_count
+        r_ratio = 0 if gt_count == 0 else r_sum / gt_count
+        return 0 if r_ratio + p_ratio == 0 else 2 * r_ratio * p_ratio / (r_ratio + p_ratio)
+
     def evaluate(self, annotations, predictions):
         recall = self.recall_sum / self.num_valid_gt if self.num_valid_gt != 0 else 0
         precision = self.precision_sum / self.num_valid_detections if self.num_valid_detections != 0 else 0
@@ -403,6 +421,10 @@ def parameters(cls):
                 min_value=0, max_value=1, optional=True, default=0.5,
                 description="Minimal value for intersection over union that allows to make decision "
                             "that prediction polygon matched with ignored annotation."
+            ),
+            'word_spotting': BoolField(
+                optional=True, default=False,
+                description="Allows to use transcriptions in order to compute word spotting metrics"
             )
         })
 
@@ -412,13 +434,18 @@ def configure(self):
         self.iou_constrain = self.get_value_from_config('iou_constrain')
         self.area_precision_constrain = self.get_value_from_config('area_precision_constrain')
         self.ignore_difficult = self.get_value_from_config('ignore_difficult')
+        self.word_spotting = self.get_value_from_config('word_spotting')
         self.number_matched_detections = 0
         self.number_valid_annotations = 0
         self.number_valid_detections = 0
 
     def update(self, annotation, prediction):
         gt_polygons = list(map(polygon_from_points, annotation.points))
+        gt_texts = list(annotation.description)
+
         prediction_polygons = list(map(polygon_from_points, prediction.points))
+        prediction_texts = list(prediction.description)
+
         num_gt = len(gt_polygons)
         num_det = len(prediction_polygons)
         gt_difficult_mask = np.full(num_gt, False)
@@ -432,7 +459,8 @@ def update(self, annotation, prediction):
             for det_id, detection_polygon in enumerate(prediction_polygons):
                 for gt_difficult_id in gt_difficult_inds:
                     gt_difficult_polygon = gt_polygons[gt_difficult_id]
-                    intersected_area = get_intersection_area(gt_difficult_polygon, detection_polygon)
+                    intersected_area = get_intersection_area(gt_difficult_polygon,
+                                                             detection_polygon)
                     pd_dimensions = detection_polygon.area
                     precision = 0 if pd_dimensions == 0 else intersected_area / pd_dimensions
 
@@ -451,7 +479,12 @@ def update(self, annotation, prediction):
                     not_matched_before = gt_matched[gt_id] == 0 and det_matched[pred_id] == 0
                     not_difficult = not gt_difficult_mask[gt_id] and not prediction_difficult_mask[pred_id]
                     if not_matched_before and not_difficult:
-                        if iou_matrix[gt_id, pred_id] >= self.iou_constrain:
+                        iou_big_enough = iou_matrix[gt_id, pred_id] >= self.iou_constrain
+                        if not self.word_spotting:
+                            transcriptions_equal = True
+                        else:
+                            transcriptions_equal = gt_texts[gt_id].lower() == prediction_texts[pred_id].lower()
+                        if iou_big_enough and transcriptions_equal:
                             gt_matched[gt_id] = 1
                             det_matched[pred_id] = 1
                             num_det_matched += 1
@@ -465,6 +498,8 @@ def update(self, annotation, prediction):
         self.number_valid_annotations += num_valid_gt
         self.number_valid_detections += num_valid_pred
 
+        return num_det_matched, num_valid_gt, num_valid_pred
+
     def evaluate(self, annotations, predictions):
         raise NotImplementedError()
 
@@ -477,6 +512,10 @@ def reset(self):
 class IncidentalSceneTextLocalizationPrecision(IncidentalSceneTextLocalizationMetric):
     __provider__ = 'incidental_text_precision'
 
+    def update(self, annotation, prediction):
+        num_det_matched, _, num_valid_dt = super().update(annotation, prediction)
+        return 0 if num_valid_dt == 0 else float(num_det_matched) / num_valid_dt
+
     def evaluate(self, annotations, predictions):
         precision = (
             0 if self.number_valid_detections == 0
@@ -489,6 +528,10 @@ def evaluate(self, annotations, predictions):
 class IncidentalSceneTextLocalizationRecall(IncidentalSceneTextLocalizationMetric):
     __provider__ = 'incidental_text_recall'
 
+    def update(self, annotation, prediction):
+        num_det_matched, num_valid_gt, _ = super().update(annotation, prediction)
+        return 0 if num_valid_gt == 0 else float(num_det_matched) / num_valid_gt
+
     def evaluate(self, annotations, predictions):
         recall = (
             0 if self.number_valid_annotations == 0
@@ -501,6 +544,13 @@ def evaluate(self, annotations, predictions):
 class IncidentalSceneTextLocalizationHMean(IncidentalSceneTextLocalizationMetric):
     __provider__ = 'incidental_text_hmean'
 
+    def update(self, annotation, prediction):
+        num_det_matched, num_valid_gt, num_valid_pred = super().update(annotation, prediction)
+        precision = 0 if num_valid_pred == 0 else num_det_matched / num_valid_pred
+        recall = 0 if num_valid_gt == 0 else num_det_matched / num_valid_gt
+
+        return 0 if precision + recall == 0 else 2 * recall * precision / (recall + precision)
+
     def evaluate(self, annotations, predictions):
         recall = (
             0 if self.number_valid_annotations == 0
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/README.md b/tools/accuracy_checker/accuracy_checker/postprocessor/README.md
index b444fb0fbf1..01a31e6b154 100644
--- a/tools/accuracy_checker/accuracy_checker/postprocessor/README.md
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/README.md
@@ -1,13 +1,13 @@
 # Postprocessors
 
-Postprocessor is function which processes prediction and/or annotation data after model infer and before metric calculation. For correct work postprocessors require specific representation format. 
-(e. g. clip boxes postprocessor expects detection annotation and detection prediction for processing). 
+Postprocessor is function which processes prediction and/or annotation data after model infer and before metric calculation. For correct work postprocessors require specific representation format.
+(e. g. clip boxes postprocessor expects detection annotation and detection prediction for processing).
 
-In case when you use complicated representation located in representation container, you can add options `annotation_source` and `prediction_source` in configuration file, 
-if you want process only specific representations, another way postprocessor will be used for all suitable representations. `annotation_source` and `prediction_source` should contain 
+In case when you use complicated representation located in representation container, you can add options `annotation_source` and `prediction_source` in configuration file,
+if you want process only specific representations, another way postprocessor will be used for all suitable representations. `annotation_source` and `prediction_source` should contain
 comma separated list of annotation identifiers and output layer names respectively.
 
-Every postprocessor has parameters available for configuration. 
+Every postprocessor has parameters available for configuration.
 
 Accuracy Checker supports following set of postprocessors:
 
@@ -22,7 +22,7 @@ Accuracy Checker supports following set of postprocessors:
   * `dst_width` and `dst_height` - destination width and height respectively. You can also use `size` instead in case when destination sizes are equal.
 * `resize_prediction_boxes` - resizing normalized detection prediction boxes according to image size. Supported representations: `DetectionAnotation`, `DetectionPrediction`.
 * `faster_rcnn_postprocessing_resize` - resizing normalized detection prediction boxes according to the original image size before preprocessing steps.
-    Supported representations: `DetectionAnotation`, `DetectionPrediction`.     
+    Supported representations: `DetectionAnotation`, `DetectionPrediction`.
     At the moment works in the following cases only:
    - the preprocessing steps contains only one operation changing input image size, and the operation is `resize`
    - the preprocessing steps contains only two operations changing input image size, and the operations are `resize` and then `padding`.
@@ -43,7 +43,7 @@ Accuracy Checker supports following set of postprocessors:
   * `apply_to` - determines target masks for processing (`annotation` for ground truth and `prediction` for detection results, `all` for both).
   **Note:** this postprocessing requires specific dataset meta: `segmentation_colors` for annotations and `prediction_to_gt_labels` for predictions.
 * `resize_segmentation_mask` - resizing segmentation mask. Supported representations: `SegmentationAnotation`, `SegmentationPrediction`.
-  * `dst_width` and `dst_height` - destination width and height for box clipping respectively. You can also use `size` instead in case when destination sizes are equal. 
+  * `dst_width` and `dst_height` - destination width and height for resize respectively. You can also use `size` instead in case when destination sizes are equal.
     If any of these parameters are not specified, image size will be used as default.
   * `apply_to` - determines target masks for processing (`annotation` for ground truth and `prediction` for detection results, `all` for both).
 * `extend_segmentation_mask` - extending annotation segmentation mask to predicted mask size making border filled by specific value. Supported representations: `SegmentationAnotation`, `SegmentationPrediction`.
@@ -56,4 +56,15 @@ Accuracy Checker supports following set of postprocessors:
 * `clip_segmentation_mask` - clipping segmentation mask values. Supported representations: `BrainTumorSegmentationAnnotation`, `BrainTumorSegmentationPrediction`.
   * `min_value` - lower bound of range.
   * `max_value` - upper bound of range.
-* `segmentation-prediction-resample` - resamples output prediction in two steps: 1) resizes it to bounding box size; 2) extends to annotation size. Supported representations: `BrainTumorSegmentationAnnotation`, `BrainTumorSegmentationPrediction`. For correct bounding box size must be set via tag `boxes_file` in `brats_numpy` [converter](../annotation_converters/README.md).
+* `segmentation_prediction_resample` - resamples output prediction in two steps: 1) resizes it to bounding box size; 2) extends to annotation size. Supported representations: `BrainTumorSegmentationAnnotation`, `BrainTumorSegmentationPrediction`. For correct work, the bounding box size must be set either via the `boxes_file` tag in the `brats_numpy` [converter](../annotation_converters/README.md) or by the `crop_brats` [preprocessor](../preprocessor/README.md).
+  * `make_argmax` - applies argmax operation to prediction mask after resampling (by default `False`). Must be specified only one option `make_argmax`.
+* `transform_brats_prediction` - transforms prediction from `WT-TC-ET` format to `NCR/NET-ED-ET`. Sequentially fills one-channel mask with specified `values` for elements passing the threshold (threshold is `0.5`) from each prediction channel in specified `order`.
+  * `order` - specifies filling order for channels
+  * `values` - specifies values for each channel according to new order
+* `extract_answers_tokens` - extracts the predicted answer as a sequence of tokens from the annotation text. Supported representations: `QuestionAnsweringAnnotation`, `QuestionAnsweringPrediction`.
+  * `max_answer` - maximum answer length (Optional, default value is 30).
+  * `n_best_size` - total number of n-best prediction size for the answer (Optional, default value is 20).
+* `translate_3d_poses` - translating 3D poses. Supported representations: `PoseEstimation3dAnnotation`, `PoseEstimation3dPrediction`. Shifts the 3D coordinates of each predicted pose by the corresponding translation vector.
+* `resize_super_resolution` - resizing super resolution predicted image. Supported representations: `SuperResolutionAnnotation`, `SuperResolutionPrediction`.
+  * `dst_width` and `dst_height` - destination width and height for resizing respectively. You can also use `size` instead in case when destination sizes are equal.
+    If any of these parameters are not specified, gt high resolution image size will be used as default.
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/__init__.py b/tools/accuracy_checker/accuracy_checker/postprocessor/__init__.py
index 8905d186add..67fe696bc40 100644
--- a/tools/accuracy_checker/accuracy_checker/postprocessor/__init__.py
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/__init__.py
@@ -42,7 +42,11 @@
 from .crop_segmentation_mask import CropSegmentationMask
 from .clip_segmentation_mask import ClipSegmentationMask
 from .normalize_boxes import NormalizeBoxes
-from .resample_segmentation_prediction import SegmentationPredictionResample
+from .brats_postprocessing import SegmentationPredictionResample, TransformBratsPrediction
+from .extract_answers_tokens import ExtractSQUADPrediction
+from .translate_3d_poses import Translate3dPoses
+from .normalize_recomendation import MinMaxNormalizeRecommendation, SigmoidNormalizeRecommendation
+from .resize_super_resolution import ResizeSuperResolution
 
 __all__ = [
     'Postprocessor',
@@ -71,7 +75,18 @@
     'ZoomSegMask',
     'CropSegmentationMask',
     'ClipSegmentationMask',
+
     'SegmentationPredictionResample',
+    'TransformBratsPrediction',
+
+    'NormalizeLandmarksPoints',
+
+    'ExtractSQUADPrediction',
+
+    'Translate3dPoses',
+
+    'SigmoidNormalizeRecommendation',
+    'MinMaxNormalizeRecommendation',
 
-    'NormalizeLandmarksPoints'
+    'ResizeSuperResolution'
 ]
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/brats_postprocessing.py b/tools/accuracy_checker/accuracy_checker/postprocessor/brats_postprocessing.py
new file mode 100644
index 00000000000..648c805e84d
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/brats_postprocessing.py
@@ -0,0 +1,133 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import numpy as np
+from .postprocessor import Postprocessor
+from ..config import ConfigError, BoolField, ListField, NumberField
+from ..representation import BrainTumorSegmentationPrediction, BrainTumorSegmentationAnnotation
+try:
+    from scipy.ndimage import interpolation
+except ImportError:
+    interpolation = None
+
+
+def resample(data, shape):
+    # Linear (order=1) interpolation with per-axis zoom factors target_size / source_size.
+    if interpolation is None:
+        raise ValueError('scipy required, please install it')
+    if len(shape) != len(data.shape):
+        raise RuntimeError('Dimensions of input array and shape are different. Resampling is impossible.')
+    return interpolation.zoom(data, zoom=[float(dst) / src for src, dst in zip(data.shape, shape)], order=1)
+
+
+class SegmentationPredictionResample(Postprocessor):
+    __provider__ = "segmentation_prediction_resample"
+
+    prediction_types = (BrainTumorSegmentationPrediction, )
+    annotation_types = (BrainTumorSegmentationAnnotation, )
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'make_argmax': BoolField(optional=True, default=False,
+                                     description="Applies argmax operation for prediction")
+        })
+        return parameters
+
+    def configure(self):
+        self.make_argmax = self.get_value_from_config('make_argmax')
+
+    def process_image(self, annotations, predictions):
+        raise RuntimeError("Since `process_image_with_metadata` is overriden, this method MUST NOT be called")
+
+    def process_image_with_metadata(self, annotation, prediction, image_metadata=None):
+        """Resize the prediction to the bounding box and place it into an annotation-sized volume."""
+        if not len(annotation) == len(prediction) == 1:
+            raise RuntimeError('Postprocessor {} does not support multiple annotation and/or prediction.'
+                               .format(self.__provider__))
+
+        annotation_ = annotation[0]
+        prediction_ = prediction[0]
+
+        # `box` is indexed as a 2D array below, so it is compared with None explicitly:
+        # truth-testing a multi-element numpy array raises ValueError.
+        box = annotation_.box
+        if box is None:
+            box = (image_metadata or {}).get('box')
+        if box is None:
+            raise ValueError('Postprocessor {} not found bounding box.'.format(self.__provider__))
+
+        low = box[0, :]
+        high = box[1, :]
+        diff = (high - low).astype(np.int32)
+
+        image_shape = annotation_.mask.shape[-3:]
+        channels = prediction_.mask.shape[0]
+        box_shape = (diff[0], diff[1], diff[2])
+
+        # Everything outside of the box stays zero in the full-size result.
+        label = np.zeros(shape=(channels,) + image_shape)
+        label[:, low[0]:high[0], low[1]:high[1], low[2]:high[2]] = resample(
+            prediction_.mask, (channels,) + box_shape
+        )
+
+        if self.make_argmax:
+            label = np.argmax(label, axis=0).astype(np.int8)
+            label = np.expand_dims(label, axis=0)
+
+        prediction_.mask = label
+
+        return annotation, prediction
+
+
+class TransformBratsPrediction(Postprocessor):
+    __provider__ = 'transform_brats_prediction'
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'order': ListField(value_type=NumberField(value_type=int, min_value=0), validate_values=True,
+                               description="Specifies channel order of filling"),
+            'values': ListField(value_type=int, validate_values=True,
+                                description="Specifies values for each channel according to new order")
+        })
+        return parameters
+
+    def configure(self):
+        self.order = self.get_value_from_config('order')
+        self.values = self.get_value_from_config('values')
+        if len(self.order) != len(self.values):
+            raise ConfigError('Length of "order" and "values" must be the same')
+
+    def process_image(self, annotation, prediction):
+        """Collapse the thresholded multi-channel prediction into a one-channel label mask."""
+        if not len(annotation) == len(prediction) == 1:
+            raise RuntimeError('Postprocessor {} does not support multiple annotation and/or prediction.'
+                               .format(self.__provider__))
+
+        channels_mask = prediction[0].mask > 0.5
+        merged = np.zeros(shape=channels_mask.shape[1:], dtype=np.int8)
+
+        # Channels are painted in the configured order, so a later channel overwrites
+        # the values written by earlier ones wherever their masks overlap.
+        for channel, fill_value in zip(self.order, self.values):
+            merged[channels_mask[channel, :, :, :]] = fill_value
+
+        prediction[0].mask = np.expand_dims(merged, axis=0)
+
+        return annotation, prediction
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/extract_answers_tokens.py b/tools/accuracy_checker/accuracy_checker/postprocessor/extract_answers_tokens.py
new file mode 100644
index 00000000000..5c5e50e0d02
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/extract_answers_tokens.py
@@ -0,0 +1,100 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import numpy as np
+
+from .postprocessor import Postprocessor
+from ..representation import QuestionAnsweringAnnotation, QuestionAnsweringPrediction
+from ..config import NumberField
+
+
+class ExtractSQUADPrediction(Postprocessor):
+    """
+    Extract text answers from predictions
+    """
+
+    __provider__ = 'extract_answers_tokens'
+
+    annotation_types = (QuestionAnsweringAnnotation, )
+    prediction_types = (QuestionAnsweringPrediction, )
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'max_answer': NumberField(
+                optional=True, value_type=int, default=30, description="Maximum length of answer"
+            ),
+            'n_best_size': NumberField(
+                optional=True, value_type=int, default=20, description="The total number of n-best predictions."
+            )
+        })
+        return parameters
+
+    def configure(self):
+        self.max_answer = self.get_value_from_config('max_answer')
+        self.n_best_size = self.get_value_from_config('n_best_size')
+
+    def process_image(self, annotation, prediction):
+        """
+        Select the best answer span for every annotation/prediction pair.
+
+        Candidate spans are all valid (start, end) combinations of the `n_best_size` highest start
+        and end logits. The candidate with the largest `start_logit + end_logit` is appended to the
+        prediction as `start_index`, `end_index` and `tokens`. Predictions without any valid
+        candidate are left untouched.
+        """
+        def _get_best_indexes(logits, n_best_size):
+            # Indexes of the `n_best_size` largest logits, best first.
+            return np.argsort(logits)[::-1][:max(n_best_size, 0)]
+
+        def _check_indexes(start, end, length, max_answer):
+            # A span must lie inside the token sequence, be ordered and not exceed `max_answer`.
+            if start >= length or end >= length:
+                return False
+            return start <= end and end - start + 1 <= max_answer
+
+        for annotation_, prediction_ in zip(annotation, prediction):
+            start_logits = np.asarray(prediction_.start_logits)
+            end_logits = np.asarray(prediction_.end_logits)
+            num_tokens = len(annotation_.tokens)
+
+            # Evaluate the end candidates once; they are reused for every start candidate.
+            end_indexes = _get_best_indexes(end_logits, self.n_best_size)
+            # All valid spans that can be built from the n-best start and end positions.
+            candidates = [
+                (start_index, end_index)
+                for start_index in _get_best_indexes(start_logits, self.n_best_size)
+                for end_index in end_indexes
+                if _check_indexes(start_index, end_index, num_tokens, self.max_answer)
+            ]
+            if not candidates:
+                continue
+
+            # Each candidate is scored with its own pair of logits, so the reported indexes and
+            # the extracted text always describe the same span.
+            scores = [start_logits[start] + end_logits[end] for start, end in candidates]
+            best_start, best_end = candidates[int(np.argmax(scores))]
+
+            prediction_.start_index.append(best_start)
+            prediction_.end_index.append(best_end)
+
+            # Glue sub-word pieces back together; presumably "##" marks WordPiece continuations.
+            text = " ".join(annotation_.tokens[best_start:(best_end + 1)])
+            text = text.replace(" ##", "").replace("##", "").strip()
+            prediction_.tokens.append(text)
+
+        return annotation, prediction
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/faster_rcnn_postprocessing_resize.py b/tools/accuracy_checker/accuracy_checker/postprocessor/faster_rcnn_postprocessing_resize.py
index 900d9528255..94f3f7ba058 100644
--- a/tools/accuracy_checker/accuracy_checker/postprocessor/faster_rcnn_postprocessing_resize.py
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/faster_rcnn_postprocessing_resize.py
@@ -43,7 +43,7 @@ def configure(self):
         self.dst_height, self.dst_width = get_size_from_config(self.config, allow_none=True)
 
     @staticmethod
-    def _get_coeff_x_y_from_metadata(image_metadata):
+    def get_coeff_x_y_from_metadata(image_metadata):
         assert image_metadata and 'geometric_operations' in image_metadata
         geometric_operations = image_metadata['geometric_operations'] # should be list of GeometricOperationMetadata
 
@@ -84,7 +84,7 @@ def process_image_with_metadata(self, annotations, predictions, image_metadata=N
         assert image_metadata and 'geometric_operations' in image_metadata, (
             "Postprocessing step `faster_rcnn_postprocessing_resize` cannot work without "
             "metadata with `geometric_operations` field")
-        coeff_x, coeff_y = self._get_coeff_x_y_from_metadata(image_metadata)
+        coeff_x, coeff_y = self.get_coeff_x_y_from_metadata(image_metadata)
 
         for prediction in predictions:
             prediction.x_mins *= coeff_x
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/filter.py b/tools/accuracy_checker/accuracy_checker/postprocessor/filter.py
index e7e223c3301..2a4fda1d3e9 100644
--- a/tools/accuracy_checker/accuracy_checker/postprocessor/filter.py
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/filter.py
@@ -321,8 +321,8 @@ class FilterInvalidBoxes(BaseFilter):
     __provider__ = 'invalid_boxes'
 
     def apply_filter(self, entry, invalid_boxes):
-        infinite_mask_x = np.logical_or(~np.isfinite(entry.x_mins), ~np.isfinite(entry.x_maxs))
-        infinite_mask_y = np.logical_or(~np.isfinite(entry.y_mins), ~np.isfinite(entry.y_maxs))
+        infinite_mask_x = np.logical_or(~np.isfinite(entry.x_mins), ~np.isfinite(entry.x_maxs)) # pylint: disable=E1130
+        infinite_mask_y = np.logical_or(~np.isfinite(entry.y_mins), ~np.isfinite(entry.y_maxs)) # pylint: disable=E1130
         infinite_mask = np.logical_or(infinite_mask_x, infinite_mask_y)
 
         return np.argwhere(infinite_mask).reshape(-1).tolist()
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/nms.py b/tools/accuracy_checker/accuracy_checker/postprocessor/nms.py
index a30003466f4..4b08704f12e 100644
--- a/tools/accuracy_checker/accuracy_checker/postprocessor/nms.py
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/nms.py
@@ -115,7 +115,7 @@ def nms(x1, y1, x2, y2, scores, thresh, include_boundaries=True, keep_top_k=None
             union = (areas[i] + areas[order[1:]] - intersection)
             overlap = np.divide(intersection, union, out=np.zeros_like(intersection, dtype=float), where=union != 0)
 
-            order = order[np.where(overlap <= thresh)[0] + 1]
+            order = order[np.where(overlap <= thresh)[0] + 1] # pylint: disable=W0143
 
         return keep
 
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/normalize_recomendation.py b/tools/accuracy_checker/accuracy_checker/postprocessor/normalize_recomendation.py
new file mode 100644
index 00000000000..09d498a0d43
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/normalize_recomendation.py
@@ -0,0 +1,52 @@
+import numpy as np
+from ..config import NumberField, ConfigError
+from ..postprocessor.postprocessor import Postprocessor
+from ..representation import HitRatioAnnotation, HitRatioPrediction
+
+
+class MinMaxNormalizeRecommendation(Postprocessor):
+    """Linearly rescales predicted scores so that `min_value` maps to 0 and `max_value` to 1."""
+    __provider__ = 'min_max_normalize_recommendation'
+
+    annotation_types = (HitRatioAnnotation, )
+    prediction_types = (HitRatioPrediction, )
+
+    @classmethod
+    def parameters(cls):
+        params = super().parameters()
+        params['min_value'] = NumberField(
+            optional=True, default=0, value_type=float, description="min value for scale range"
+        )
+        params['max_value'] = NumberField(
+            optional=True, default=1, value_type=float, description="max value for scale range"
+        )
+
+        return params
+
+    def configure(self):
+        self.min_value = self.get_value_from_config('min_value')
+        self.max_value = self.get_value_from_config('max_value')
+        if self.max_value == self.min_value:
+            raise ConfigError('max and min values can not be equal')
+
+    def process_image(self, annotation, prediction):
+        scale_range = self.max_value - self.min_value  # non-zero, enforced in configure
+        for entry in prediction:
+            entry.scores = (entry.scores - self.min_value) / scale_range
+
+        return annotation, prediction
+
+
+class SigmoidNormalizeRecommendation(Postprocessor):
+    """Squashes predicted recommendation scores with the logistic sigmoid."""
+    __provider__ = 'sigmoid_normalize_recommendation'
+
+    annotation_types = (HitRatioAnnotation, )
+    prediction_types = (HitRatioPrediction, )
+
+    def process_image(self, annotation, prediction):
+        # Only predictions are rescaled; annotations pass through unchanged.
+        for entry in prediction:
+            entry.scores = 1 / (1 + np.exp(-entry.scores))
+
+        return annotation, prediction
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/postprocessing_executor.py b/tools/accuracy_checker/accuracy_checker/postprocessor/postprocessing_executor.py
index e124e378a78..a37549e012d 100644
--- a/tools/accuracy_checker/accuracy_checker/postprocessor/postprocessing_executor.py
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/postprocessing_executor.py
@@ -28,6 +28,8 @@ def __init__(self, processors=None, dataset_name='custom', dataset_meta=None, st
 
         self.state = state or {}
 
+        self.allow_image_postprocessor = True
+
         if not processors:
             return
 
@@ -37,19 +39,7 @@ def __init__(self, processors=None, dataset_name='custom', dataset_meta=None, st
                 on_extra_argument=ConfigValidator.IGNORE_ON_EXTRA_ARGUMENT
             )
             postprocessor_config.validate(config)
-            postprocessor = Postprocessor.provide(config['type'], config, config['type'], self.dataset_meta, state)
-            self._processors.append(postprocessor)
-
-        allow_image_postprocessor = True
-        for processor in self._processors:
-            if overrides(processor, 'process_all', Postprocessor):
-                allow_image_postprocessor = False
-                self._dataset_processors.append(processor)
-            else:
-                if allow_image_postprocessor:
-                    self._image_processors.append(processor)
-                else:
-                    self._dataset_processors.append(processor)
+            self.register_postprocessor(config)
 
     def process_dataset(self, annotations, predictions):
         for method in self._dataset_processors:
@@ -79,6 +69,10 @@ def full_process(self, annotations, predictions, metas=None):
     def has_dataset_processors(self):
         return len(self._dataset_processors) != 0
 
+    @property
+    def has_processors(self):
+        return len(self._image_processors) + len(self._dataset_processors) != 0
+
     def __call__(self, context, *args, **kwargs):
         batch_annotation = context.annotation_batch
         batch_prediction = context.prediction_batch
@@ -87,6 +81,18 @@ def __call__(self, context, *args, **kwargs):
                                                                                 batch_prediction,
                                                                                 batch_meta)
 
+    def register_postprocessor(self, config):
+        postprocessor = Postprocessor.provide(config['type'], config, config['type'], self.dataset_meta, self.state)
+        self._processors.append(postprocessor)
+        if overrides(postprocessor, 'process_all', Postprocessor):
+            self.allow_image_postprocessor = False
+            self._dataset_processors.append(postprocessor)
+            return
+        if self.allow_image_postprocessor:
+            self._image_processors.append(postprocessor)
+        else:
+            self._dataset_processors.append(postprocessor)
+
 
 class PostprocessorConfig(ConfigValidator):
     type = StringField(choices=Postprocessor.providers)
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/postprocessor.py b/tools/accuracy_checker/accuracy_checker/postprocessor/postprocessor.py
index 0f3ca6f0756..e2d33ff5562 100644
--- a/tools/accuracy_checker/accuracy_checker/postprocessor/postprocessor.py
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/postprocessor.py
@@ -96,7 +96,7 @@ def process_image_with_metadata(self, annotation, prediction, image_metadata=Non
         return self.process_image(annotation, prediction)
 
     def process(self, annotation, prediction, image_metadata=None):
-        image_size = annotation[0].metadata.get('image_size') if not None in annotation else None
+        image_size = annotation[0].metadata.get('image_size') if None not in annotation else None
         self.image_size = None
         if image_size:
             self.image_size = image_size[0]
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/resample_segmentation_prediction.py b/tools/accuracy_checker/accuracy_checker/postprocessor/resample_segmentation_prediction.py
deleted file mode 100644
index 80e85437a86..00000000000
--- a/tools/accuracy_checker/accuracy_checker/postprocessor/resample_segmentation_prediction.py
+++ /dev/null
@@ -1,64 +0,0 @@
-"""
-Copyright (c) 2019 Intel Corporation
-
-Licensed under the Apache License, Version 2.0 (the "License");
-you may not use this file except in compliance with the License.
-You may obtain a copy of the License at
-
-      http://www.apache.org/licenses/LICENSE-2.0
-
-Unless required by applicable law or agreed to in writing, software
-distributed under the License is distributed on an "AS IS" BASIS,
-WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-See the License for the specific language governing permissions and
-limitations under the License.
-"""
-
-import numpy as np
-from scipy.ndimage import interpolation
-from .postprocessor import Postprocessor
-from ..representation import BrainTumorSegmentationPrediction, BrainTumorSegmentationAnnotation
-
-
-def resample(data, shape):
-    if len(data.shape) != len(shape):
-        raise RuntimeError('Dimensions of input array and shape are different. Resampling is impossible.')
-    factor = [float(o) / i for i, o in zip(data.shape, shape)]
-    return interpolation.zoom(data, zoom=factor, order=1)
-
-
-class SegmentationPredictionResample(Postprocessor):
-    __provider__ = "segmentation_prediction_resample"
-
-    prediction_types = (BrainTumorSegmentationPrediction, )
-    annotation_types = (BrainTumorSegmentationAnnotation, )
-
-    def process_image(self, annotation, prediction):
-        if not len(annotation) == len(prediction) == 1:
-            raise RuntimeError('Postprocessor {} does not support multiple annotation and/or prediction.'
-                               .format(self.__provider__))
-
-        if not annotation[0].box:
-            raise ValueError('Postprocessor {} not found bounding box.'.format(self.__provider__))
-
-        annotation_ = annotation[0]
-        prediction_ = prediction[0]
-
-        low = annotation_.box[0, :]
-        high = annotation_.box[1, :]
-        diff = (high - low).astype(np.int32)
-
-        annotation_shape = annotation_.mask.shape
-        prediction_shape = prediction_.mask.shape
-
-        image_shape = annotation_shape[len(annotation_shape)-3:len(annotation_shape)]
-        box_shape = (diff[0], diff[1], diff[2])
-
-        label = np.zeros(shape=(prediction_shape[0],) + image_shape)
-
-        label[:, low[0]:high[0], low[1]:high[1], low[2]:high[2]] = resample(prediction_.mask,
-                                                                            (prediction_shape[0],) + box_shape)
-
-        prediction[0].mask = label
-
-        return annotation, prediction
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/resize_segmentation_mask.py b/tools/accuracy_checker/accuracy_checker/postprocessor/resize_segmentation_mask.py
index 239e6c1171a..3b82d5423d3 100644
--- a/tools/accuracy_checker/accuracy_checker/postprocessor/resize_segmentation_mask.py
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/resize_segmentation_mask.py
@@ -15,13 +15,17 @@
 """
 
 from functools import singledispatch
-import scipy.misc
 import numpy as np
 
 from ..config import NumberField
 from ..utils import get_size_from_config
 from .postprocessor import PostprocessorWithSpecificTargets
 from ..representation import SegmentationPrediction, SegmentationAnnotation
+try:
+    from PIL import Image
+except ImportError:
+    Image = None
+
 
 class ResizeSegmentationMask(PostprocessorWithSpecificTargets):
     __provider__ = 'resize_segmentation_mask'
@@ -34,19 +38,21 @@ def parameters(cls):
         parameters = super().parameters()
         parameters.update({
             'dst_width': NumberField(
-                value_type=int, optional=True, min_value=1, description="Destination width for box clipping."
+                value_type=int, optional=True, min_value=1, description="Destination width for resize"
             ),
             'dst_height': NumberField(
-                value_type=int, optional=True, min_value=1, description="Destination height for box clipping."
+                value_type=int, optional=True, min_value=1, description="Destination height for resize."
             ),
             'size': NumberField(
                 value_type=int, optional=True, min_value=1,
-                description="Destination size for box clipping for both dimensions."
+                description="Destination size for resize for both dimensions (height and width)."
             )
         })
         return parameters
 
     def configure(self):
+        if Image is None:
+            raise ValueError('{} requires pillow, please install it'.format(self.__provider__))
         self.dst_height, self.dst_width = get_size_from_config(self.config, allow_none=True)
 
     def process_image(self, annotation, prediction):
@@ -61,7 +67,7 @@ def resize_segmentation_mask(entry, height, width):
         def _(entry, height, width):
             entry_mask = []
             for class_mask in entry.mask:
-                resized_mask = scipy.misc.imresize(class_mask, (height, width), 'nearest')
+                resized_mask = self.resize(class_mask, width, height)
                 entry_mask.append(resized_mask)
             entry.mask = np.array(entry_mask)
 
@@ -69,7 +75,7 @@ def _(entry, height, width):
 
         @resize_segmentation_mask.register(SegmentationAnnotation)
         def _(entry, height, width):
-            entry.mask = scipy.misc.imresize(entry.mask, (height, width), 'nearest')
+            entry.mask = self.resize(entry.mask, width, height)
             return entry
 
         for target in annotation:
@@ -79,3 +85,50 @@ def _(entry, height, width):
             resize_segmentation_mask(target, target_height, target_width)
 
         return annotation, prediction
+
+    def _to_image(self, arr):
+        data = np.asarray(arr)
+        if np.iscomplexobj(data):
+            raise ValueError("Cannot convert a complex-valued array.")
+        shape = list(data.shape)
+        if len(shape) == 2:
+            return self._process_2d(data, shape)
+        if len(shape) == 3 and shape[2] in (3, 4):
+            return self._process_3d(data, shape)
+        raise ValueError("'arr' does not have a suitable array shape for any mode.")
+
+    def _process_2d(self, data, shape):
+        height, width = shape  # 2-D shape unpacks as (height, width); frombytes takes (width, height)
+        bytedata = self._bytescale(data)
+        # ndarray.tobytes() is the supported name for the deprecated tostring() alias.
+        image = Image.frombytes('L', (width, height), bytedata.tobytes())
+        return image
+
+    def _process_3d(self, data, shape):
+        bytedata = self._bytescale(data)
+        height, width, channels = shape
+        mode = 'RGB' if channels == 3 else 'RGBA'  # caller only passes 3 or 4 channels
+        # ndarray.tobytes() is the supported name for the deprecated tostring() alias.
+        image = Image.frombytes(mode, (width, height), bytedata.tobytes())
+        return image
+
+    @staticmethod
+    def _bytescale(data):
+        if data.dtype == np.uint8:
+            return data
+        cmin = data.min()
+        cmax = data.max()
+        cscale = cmax - cmin
+        if cscale == 0:
+            cscale = 1
+
+        scale = float(255) / cscale
+        bytedata = (data - cmin) * scale
+
+        return (bytedata.clip(0, 255) + 0.5).astype(np.uint8)
+
+    def resize(self, mask, width, height):
+        image = self._to_image(mask)
+        image_new = image.resize((width, height), resample=0)
+
+        return np.array(image_new)
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/resize_super_resolution.py b/tools/accuracy_checker/accuracy_checker/postprocessor/resize_super_resolution.py
new file mode 100644
index 00000000000..e4befaf6b46
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/resize_super_resolution.py
@@ -0,0 +1,50 @@
+import numpy as np
+from ..postprocessor import Postprocessor
+from ..representation import SuperResolutionPrediction, SuperResolutionAnnotation
+from ..config import NumberField
+from ..utils import get_size_from_config
+
+try:
+    from PIL import Image
+except ImportError:
+    Image = None
+
+
+class ResizeSuperResolution(Postprocessor):
+    __provider__ = 'resize_super_resolution'
+
+    annotation_types = (SuperResolutionAnnotation, )
+    prediction_types = (SuperResolutionPrediction, )
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'dst_width': NumberField(
+                value_type=int, optional=True, min_value=1, description="Destination width for resizing."
+            ),
+            'dst_height': NumberField(
+                value_type=int, optional=True, min_value=1, description="Destination height for resizing."
+            ),
+            'size': NumberField(
+                value_type=int, optional=True, min_value=1,
+                description="Destination size for resizing for both dimensions (height, width)."
+            )
+        })
+
+        return parameters
+
+    def configure(self):
+        if Image is None:
+            raise ValueError('{} requires pillow, please install it'.format(self.__provider__))
+        self.dst_height, self.dst_width = get_size_from_config(self.config, allow_none=True)
+
+    def process_image(self, annotation, prediction):
+        for annotation_, prediction_ in zip(annotation, prediction):
+            target_height = self.dst_height or annotation_.shape[0]
+            target_width = self.dst_width or annotation_.shape[1]
+            data = Image.fromarray(prediction_.value)
+            data = data.resize((target_width, target_height), Image.BICUBIC)
+            prediction_.value = np.array(data)
+
+        return annotation, prediction
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/translate_3d_poses.py b/tools/accuracy_checker/accuracy_checker/postprocessor/translate_3d_poses.py
new file mode 100644
index 00000000000..5bfdde916c0
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/translate_3d_poses.py
@@ -0,0 +1,35 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+from ..representation import PoseEstimation3dAnnotation, PoseEstimation3dPrediction
+from .postprocessor import Postprocessor
+
+
+class Translate3dPoses(Postprocessor):
+    __provider__ = 'translate_3d_poses'
+    annotation_types = (PoseEstimation3dAnnotation,)
+    prediction_types = (PoseEstimation3dPrediction,)
+
+    def process_image(self, annotations, predictions):
+        for batch_id, prediction in enumerate(predictions):
+            for pose_id in range(prediction.size):
+                translation = prediction.translations[pose_id]
+                translation[2] *= annotations[batch_id].fx
+                prediction.x_3d_values[pose_id] += translation[0]
+                prediction.y_3d_values[pose_id] += translation[1]
+                prediction.z_3d_values[pose_id] += translation[2]
+
+        return annotations, predictions
diff --git a/tools/accuracy_checker/accuracy_checker/postprocessor/zoom_segmentation_mask.py b/tools/accuracy_checker/accuracy_checker/postprocessor/zoom_segmentation_mask.py
index 8bc87c85780..5bac25938a3 100644
--- a/tools/accuracy_checker/accuracy_checker/postprocessor/zoom_segmentation_mask.py
+++ b/tools/accuracy_checker/accuracy_checker/postprocessor/zoom_segmentation_mask.py
@@ -21,6 +21,7 @@
 from ..config import NumberField
 from ..logging import warning
 
+
 class ZoomSegMask(Postprocessor):
     """
     Zoom probabilities of segmentation prediction.
diff --git a/tools/accuracy_checker/accuracy_checker/preprocessor/README.md b/tools/accuracy_checker/accuracy_checker/preprocessor/README.md
index a2929dff680..561ee79d066 100644
--- a/tools/accuracy_checker/accuracy_checker/preprocessor/README.md
+++ b/tools/accuracy_checker/accuracy_checker/preprocessor/README.md
@@ -7,7 +7,7 @@ Accuracy Checker supports following set of preprocessors:
 * `resize` - resizing the image to a new width and height.
   * `dst_width` and `dst_height` are destination width and height for image resizing respectively.
     You can also use `size` instead in case when destination sizes are equal for both dimensions.
-  * `resize_realization` - parameter specifies functionality of which library will be used for resize: `opencv`, `pillow` or `tf` (default `opencv` is used). For enabling `tf` you need to install Tensorflow first.
+  * `resize_realization` - parameter specifies functionality of which library will be used for resize: `opencv`, `pillow` or `tf` (default `opencv` is used). For enabling `tf` you need to install TensorFlow first.
   For compatibility with previous releases you can also use boolean constants for selection resizing backend:
     * `use_pillow` parameter specifies usage of Pillow library for resizing.
     * `use_tensorflow` parameter specifies usage of TensorFlow Image for resizing. Requires TensorFlow installation.
@@ -40,11 +40,27 @@ Accuracy Checker supports following set of preprocessors:
      You can specify one value for all channels or list of comma separated channel-wise values.
   * `std` specifies values, on which pixels will be divided.
      You can specify one value for all channels or list of comma separated channel-wise values.
-
      These parameters support work with precomputed values of frequently used datasets (e.g. `cifar10` or `imagenet`).
-
+* `resize3d` - resizing 3d image (e.g. MRI scans) to new size:
+  * `size` in format `(H,W,D)`. All values will be interpolated with 1st-order spline.
+* `crop_brats` - performing crop of 3d images (e.g. MRI scans) by cropping all non-zero voxels. Also sets bounding boxes for `segmentation_prediction_resample` postprocessor (see [Postprocessors](../postprocessor/README.md))
+* `normalize_brats` - normalization of 3d images (e.g. MRI scans) with z-score normalization
+  * `masked` - specifies type of masking:
+    * `none` for not applying mask
+    * `ignore` for ignoring "empty" voxels in statistic calculation
+    * `nullify` for nullifying initially "empty" voxels at the end
+    * `all` for `ignore` and `nullify`
+  * `cutoff` - cuts minimum and maximum values to `-cutoff` and `cutoff` respectively
+  * `shift_value` - adds to all values
+  * `normalize_value` - divides all values
+* `swap_modalities` - swapping modalities of MRI scan (works as channel swapping)
+  * `modality_order` - new order
 * `bgr_to_rgb` - reversing image channels. Convert image in BGR format to RGB.
-* `bgr_to_gray` - converting image in BGR to grayscale color space.
+* `bgr_to_gray` - converting image in BGR to gray scale color space.
+* `rgb_to_bgr` - reversing image channels. Convert image in RGB format to BGR.
+* `rgb_to_gray` - converting image in RGB to gray scale color space.
+* `select_channel` - selecting only one specified channel from a multichannel image.
+  * `channel` - channel id in image (e.g. if you read image in RGB and want to select green channel, you need to specify 1 as channel)
 * `flip` - image mirroring around specified axis.
   * `mode` specifies the axis for flipping (`vertical` or `horizontal`).
 * `crop` - central cropping for image.
@@ -73,11 +89,13 @@ Accuracy Checker supports following set of preprocessors:
   * `dst_width`, `dst_height` and `dst_volume` are destination width, height and volume for cropped 3D-image respectively.
     You can also use `size` instead in case when destination sizes are equal for all three dimensions.
 * `normalize3d` - normalizing 3D-images using mean and std values per channel of current image for subtraction and division respectively.
-* `tf_convert_image_dtype` - cast image values to floating point values in range [0, 1]. Requires Tensorflow installation.
+* `tf_convert_image_dtype` - cast image values to floating point values in range [0, 1]. Requires TensorFlow installation.
 * `decode_by_vocabulary` - Decode words to set of indexes using model vocab.
   * `vocabulary_file` - path to vocabulary file for decoding. Path can be prefixed with `--models` argument.
   * `unk_index` - index of unknown symbol in vocab.
 *  `pad_with_eos` - supplement the input sequence to a specific size using a line terminator character or index.
   * `eos_symbol` or `eos_index` - line terminator symbol or index of this symbol in vocab for encoded sequence respectively.
   *  `sequence_len` - length of sequence after supplement.
-
+* `centernet_affine_transform` - CenterNet affine transformation, used for image resizing.
+  * `dst_width` and `dst_height` are destination width and height for image respectively. You can also use `size` instead in case when destination sizes are equal for both dimensions.
+  * `scale` - scale factor for image (default is 1).
diff --git a/tools/accuracy_checker/accuracy_checker/preprocessor/__init__.py b/tools/accuracy_checker/accuracy_checker/preprocessor/__init__.py
index df6fcf598fb..ee0e4cea27c 100644
--- a/tools/accuracy_checker/accuracy_checker/preprocessor/__init__.py
+++ b/tools/accuracy_checker/accuracy_checker/preprocessor/__init__.py
@@ -16,21 +16,24 @@
 
 from .preprocessing_executor import PreprocessingExecutor
 from .preprocessor import Preprocessor
-from .color_spece_conversion import BgrToRgb, BgrToGray, TfConvertImageDType
+from .color_space_conversion import BgrToRgb, RgbToBgr, BgrToGray, RgbToGray, TfConvertImageDType, SelectInputChannel
 from .normalization import Normalize, Normalize3d
 from .geometric_transformations import (
     GeometricOperationMetadata,
-    Resize,
-    AutoResize,
     Flip,
     Crop,
     CropRect,
     ExtendAroundRect,
     PointAligner,
     Tiling,
-    Crop3D
+    Crop3D,
+    TransformedCropWithAutoScale,
+    ImagePyramid
 )
+from .resize import Resize, AutoResize
 from .nlp_preprocessors import DecodeByVocabulary, PadWithEOS
+from .centernet_preprocessing import CenterNetAffineTransformation
+from .brats_preprocessing import Resize3D, NormalizeBrats, CropBraTS, SwapModalitiesBrats
 
 __all__ = [
     'PreprocessingExecutor',
@@ -39,6 +42,7 @@
     'GeometricOperationMetadata',
 
     'Resize',
+    'Resize3D',
     'AutoResize',
     'Flip',
     'Crop',
@@ -47,14 +51,25 @@
     'PointAligner',
     'Tiling',
     'Crop3D',
+    'CropBraTS',
+    'TransformedCropWithAutoScale',
+    'ImagePyramid',
 
     'BgrToGray',
     'BgrToRgb',
+    'RgbToGray',
+    'RgbToBgr',
     'TfConvertImageDType',
+    'SelectInputChannel',
 
     'Normalize3d',
     'Normalize',
+    'NormalizeBrats',
+
+    'SwapModalitiesBrats',
 
     'DecodeByVocabulary',
-    'PadWithEOS'
+    'PadWithEOS',
+
+    'CenterNetAffineTransformation'
 ]
diff --git a/tools/accuracy_checker/accuracy_checker/preprocessor/brats_preprocessing.py b/tools/accuracy_checker/accuracy_checker/preprocessor/brats_preprocessing.py
new file mode 100644
index 00000000000..2b121528333
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/preprocessor/brats_preprocessing.py
@@ -0,0 +1,200 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import numpy as np
+
+from ..config import ConfigError, BaseField, NumberField, ListField, StringField
+from ..preprocessor import Preprocessor
+from ..utils import get_or_parse_value
+
+try:
+    from scipy.ndimage import interpolation
+except ImportError:
+    interpolation = None
+
+
+class Resize3D(Preprocessor):
+    __provider__ = 'resize3d'
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'size': BaseField(optional=True, description='Specifies resize'),
+        })
+        return parameters
+
+    def configure(self):
+        if interpolation is None:
+            raise ValueError('resize3d require scipy, please install it before usage.')
+
+        self.shape = self._check_size(
+            get_or_parse_value(self.config.get('size'), default=(128, 128, 128), casting_type=int))
+
+    def process(self, image, annotation_meta=None):
+        data = np.asarray(image.data)
+        shape = self.shape if len(data.shape) == 3 else (data.shape[0],) + self.shape
+        if len(data.shape) != len(shape):
+            raise RuntimeError('Shape of original data and resize shape are mismatched for {} preprocessor '
+                               '(data shape - {}, resize shape - {})'.format(self.__provider__, data.shape, shape))
+
+        factor = [float(o) / i for i, o in zip(data.shape, shape)]
+        image.data = interpolation.zoom(data, zoom=factor, order=1)
+
+        return image
+
+    def _check_size(self, size):
+        if len(size) != 3:  # resize3d needs exactly three target dimensions
+            raise ConfigError("Incorrect size dimension for {} - must be 3, but {} found"
+                              .format(self.__provider__, len(size)))
+        if not all(np.array(size) > 0):  # every target dimension must be strictly positive
+            raise ConfigError("Size must be positive value for {}, but {} found".format(self.__provider__, size))
+        return size
+
+
+class CropBraTS(Preprocessor):
+    __provider__ = 'crop_brats'
+
+    def process(self, image, annotation_meta=None):
+        def bbox3(img):
+            # Find the indexes of non-zero voxels along axes 0, 1 and 2 respectively
+            nonzero_across_axis_0 = np.any(img, axis=(1, 2)).nonzero()
+            nonzero_across_axis_1 = np.any(img, axis=(0, 2)).nonzero()
+            nonzero_across_axis_2 = np.any(img, axis=(0, 1)).nonzero()
+
+            nonzero_across_axis_0 = nonzero_across_axis_0[0]
+            nonzero_across_axis_1 = nonzero_across_axis_1[0]
+            nonzero_across_axis_2 = nonzero_across_axis_2[0]
+
+            # If no non-zero voxel is found along axis 0, the image is blank: return the placeholder box
+            bbox = np.array([[-1, -1, -1], [0, 0, 0]])
+            if nonzero_across_axis_0.size == 0:
+                return bbox
+
+            bbox[:, 0] = nonzero_across_axis_0[[0, -1]]
+            bbox[:, 1] = nonzero_across_axis_1[[0, -1]]
+            bbox[:, 2] = nonzero_across_axis_2[[0, -1]]
+
+            return bbox
+        # One (2, 3) box (row 0 - first non-zero indexes, row 1 - last) per entry along axis 0 of the data
+        bboxes = np.zeros((image.data.shape[0],) + (2, 3))
+        for i in range(image.data.shape[0]):
+            bboxes[i] = bbox3(image.data[i, :, :, :])
+        # Combine the per-entry boxes: smallest first index and largest last index for every axis
+        bbox_min = np.min(bboxes[:, 0, :], axis=0).ravel().astype(int)
+        bbox_max = np.max(bboxes[:, 1, :], axis=0).ravel().astype(int)
+        bbox = np.zeros((2, 3), dtype=int)
+        bbox[0] = bbox_min
+        bbox[1] = bbox_max
+        # Crop all entries to the combined box (the upper bound of each slice is exclusive)
+        image.data = image.data[:, bbox[0, 0]:bbox[1, 0], bbox[0, 1]:bbox[1, 1], bbox[0, 2]:bbox[1, 2]]
+        # Keep the box used for cropping in the image metadata under the 'box' key
+        image.metadata['box'] = bbox
+
+        return image
+
+
+class NormalizeBrats(Preprocessor):
+    __provider__ = "normalize_brats"
+
+    _MASK_OPTIONS = {
+        'none': 0,
+        'nullify': 1,
+        'ignore': 2,
+        'all': 3,
+    }
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'masked': StringField(optional=True, choices=NormalizeBrats._MASK_OPTIONS.keys(),
+                                  default='none',  # must be a _MASK_OPTIONS key: configure() indexes the dict with it
+                                  description='Does not apply normalization to zero values. '
+                                              'Applicable for brain tumor segmentation models'),
+            'cutoff': NumberField(optional=True, default=0, min_value=0,
+                                  description='Specifies range of values - [-cutoff, cutoff]'),
+            'shift_value': NumberField(optional=True, default=0, description='Specifies shift value'),
+            'normalize_value': NumberField(optional=True, default=1, description='Specifies normalize value')
+        })
+
+        return parameters
+
+    def configure(self):
+        self.masked = NormalizeBrats._MASK_OPTIONS[self.get_value_from_config('masked')]
+        self.cutoff = self.get_value_from_config('cutoff')
+        self.shift_value = self.get_value_from_config('shift_value')
+        self.normalize_value = self.get_value_from_config('normalize_value')
+
+    def process(self, image, annotation_meta=None):
+        image.data = self.normalize_img(image.data)
+        return image
+
+    def normalize_img(self, image):
+        for channel in range(image.shape[0]):
+            img = image[channel, :, :, :].copy()
+            if self.masked in (2, 3):
+                mask = img > 0
+                image_masked = np.ma.masked_array(img, ~mask)
+                mean, std = np.mean(image_masked), np.std(image_masked)
+            else:
+                mean, std = np.mean(img), np.std(img)
+
+            img -= mean
+            img /= std
+
+            if self.cutoff > 0:
+                img = np.clip(img, -self.cutoff, self.cutoff) # pylint: disable=E1130
+            img += self.shift_value
+            img /= self.normalize_value
+            if self.masked in (1, 3):
+                mask = image[channel, :, :, :] > 0
+                img[~mask] = 0
+            image[channel, :, :, :] = img
+
+        return image
+
+
+class SwapModalitiesBrats(Preprocessor):
+    __provider__ = 'swap_modalities'
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'modality_order': ListField(value_type=NumberField(value_type=int, min_value=0, max_value=3),
+                                        validate_values=True,
+                                        description="Specifies order of modality according to model input")
+        })
+
+        return parameters
+
+    def configure(self):
+        self.modal_order = self.get_value_from_config('modality_order')
+        if len(self.modal_order) != 4:
+            raise ConfigError('{} supports only 4 modality, but found {}'
+                              .format(self.__provider__, len(self.modal_order)))
+        if len(self.modal_order) != len(set(self.modal_order)):
+            raise ConfigError('Incorrect modality index found in {} for {}. Indexes must be unique'
+                              .format(self.modal_order, self.__provider__))
+
+    def process(self, image, annotation_meta=None):
+        image.data = self.swap_modalities(image.data)
+        return image
+
+    def swap_modalities(self, image):
+        image = image[self.modal_order, :, :, :]
+        return image
diff --git a/tools/accuracy_checker/accuracy_checker/preprocessor/centernet_preprocessing.py b/tools/accuracy_checker/accuracy_checker/preprocessor/centernet_preprocessing.py
new file mode 100644
index 00000000000..13ea8c8f286
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/preprocessor/centernet_preprocessing.py
@@ -0,0 +1,108 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import cv2
+import numpy as np
+
+from ..config import NumberField
+from ..preprocessor import Preprocessor
+from ..utils import get_size_from_config
+
+
+class CenterNetAffineTransformation(Preprocessor):
+    __provider__ = 'centernet_affine_transform'
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'size': NumberField(
+                value_type=int, optional=True, min_value=1, description="Destination size for image."
+            ),
+            # dst_width/dst_height stay optional so that a config giving only `size` is accepted.
+            'dst_width': NumberField(
+                value_type=int, optional=True, min_value=1, description="Destination width for image."
+            ),
+            'dst_height': NumberField(
+                value_type=int, optional=True, min_value=1, description="Destination height for image."
+            ),
+            'scale': NumberField(
+                value_type=int, optional=True, default=1, description="Scale for input image"
+            )
+        })
+
+        return parameters
+
+    def configure(self):
+        self.input_height, self.input_width = get_size_from_config(self.config)
+        self.scale = self.get_value_from_config('scale')
+
+    @staticmethod
+    def get_affine_transform(center, scale, rot, output_size, inv=0):
+
+        def get_dir(src_point, rot_rad):
+            sn, cs = np.sin(rot_rad), np.cos(rot_rad)
+            src_result = [0, 0]
+            src_result[0] = src_point[0] * cs - src_point[1] * sn
+            src_result[1] = src_point[0] * sn + src_point[1] * cs
+            return src_result
+
+        def get_3rd_point(a, b):
+            direct = a - b
+            return b + np.array([-direct[1], direct[0]], dtype=np.float32)
+
+        if not isinstance(scale, np.ndarray) and not isinstance(scale, list):
+            scale = np.array([scale, scale], dtype=np.float32)
+
+        scale_tmp = scale
+        src_w = scale_tmp[0]
+        dst_w, dst_h = output_size
+
+        rot_rad = np.pi * rot / 180
+        src_dir = get_dir([0, src_w * -0.5], rot_rad)
+        dst_dir = np.array([0, dst_w * -0.5], dtype=np.float32)
+
+        dst = np.zeros((3, 2), dtype=np.float32)
+        src = np.zeros((3, 2), dtype=np.float32)
+        src[0, :], src[1, :] = center, center + src_dir
+        dst[0, :] = [dst_w * 0.5, dst_h * 0.5]
+        dst[1, :] = np.array([dst_w * 0.5, dst_h * 0.5], np.float32) + dst_dir
+        src[2:, :] = get_3rd_point(src[0, :], src[1, :])
+        dst[2:, :] = get_3rd_point(dst[0, :], dst[1, :])
+
+        if inv:
+            trans = cv2.getAffineTransform(np.float32(dst), np.float32(src))
+        else:
+            trans = cv2.getAffineTransform(np.float32(src), np.float32(dst))
+
+        return trans
+
+    def process(self, image, annotation_meta=None):
+        data = image.data
+        height, width = data.shape[0:2]
+        new_height = height * self.scale
+        new_width = width * self.scale
+        center = np.array([new_width / 2., new_height / 2.], dtype=np.float32)
+        scale = max(height, width) * 1.0
+
+        trans_input = self.get_affine_transform(center, scale, 0, [self.input_width, self.input_height])
+        resized_image = cv2.resize(data, (new_width, new_height))
+        inp_image = cv2.warpAffine(
+            resized_image, trans_input, (self.input_width, self.input_height),
+            flags=cv2.INTER_LINEAR)
+
+        image.data = inp_image
+        return image
diff --git a/tools/accuracy_checker/accuracy_checker/preprocessor/color_spece_conversion.py b/tools/accuracy_checker/accuracy_checker/preprocessor/color_space_conversion.py
similarity index 53%
rename from tools/accuracy_checker/accuracy_checker/preprocessor/color_spece_conversion.py
rename to tools/accuracy_checker/accuracy_checker/preprocessor/color_space_conversion.py
index 428e9e45e40..2fdf4eea47c 100644
--- a/tools/accuracy_checker/accuracy_checker/preprocessor/color_spece_conversion.py
+++ b/tools/accuracy_checker/accuracy_checker/preprocessor/color_space_conversion.py
@@ -17,6 +17,12 @@
 
 import cv2
 import numpy as np
+from ..config import NumberField
+
+try:
+    import tensorflow as tf
+except ImportError as import_error:
+    tf = None
 
 from .preprocessor import Preprocessor
 
@@ -40,18 +46,33 @@ def process(self, image, annotation_meta=None):
         image.data = np.expand_dims(cv2.cvtColor(image.data, cv2.COLOR_BGR2GRAY).astype(np.float32), -1)
         return image
 
+class RgbToBgr(Preprocessor):
+    """Reorder channels from RGB to BGR; image.data may be one array or a list of arrays."""
+    __provider__ = 'rgb_to_bgr'
+
+    def process(self, image, annotation_meta=None):
+        if isinstance(image.data, list):
+            image.data = [cv2.cvtColor(part, cv2.COLOR_RGB2BGR) for part in image.data]
+        else:
+            image.data = cv2.cvtColor(image.data, cv2.COLOR_RGB2BGR)
+        return image
+
+
+class RgbToGray(Preprocessor):
+    __provider__ = 'rgb_to_gray'
+
+    def process(self, image, annotation_meta=None):  # result is float32 with a trailing channel axis
+        image.data = cv2.cvtColor(image.data, cv2.COLOR_RGB2GRAY).astype(np.float32)[..., np.newaxis]
+        return image
+
 
 class TfConvertImageDType(Preprocessor):
     __provider__ = 'tf_convert_image_dtype'
 
     def __init__(self, config, name, input_shapes=None):
-        super().__init__(config, name, input_shapes)
-        try:
-            import tensorflow as tf
-        except ImportError as import_error:
-            raise ImportError(
-                'tf_convert_image_dtype disabled.Please, install Tensorflow before using. \n{}'.format(import_error.msg)
-            )
+        super().__init__(config, name)  # base __init__ takes only (config, name); input_shapes is kept for callers
+        if tf is None:
+            raise ImportError('*tf_convert_image_dtype* operation requires TensorFlow. Please install it before usage')
         tf.enable_eager_execution()
         self.converter = tf.image.convert_image_dtype
         self.dtype = tf.float32
@@ -61,3 +82,27 @@ def process(self, image, annotation_meta=None):
         image.data = converted_data.numpy()
 
         return image
+
+
+class SelectInputChannel(Preprocessor):
+    """Keep only the channel given by the `channel` config value, preserving a trailing channel axis."""
+    __provider__ = 'select_channel'
+
+    @classmethod
+    def parameters(cls):
+        params = super().parameters()
+        params.update({'channel': NumberField(value_type=int, min_value=0)})
+        return params
+
+    def configure(self):
+        self.channel = self.get_value_from_config('channel')
+
+    def process(self, image, annotation_meta=None):
+        # image.data may be a list of arrays; every array is sliced the same way
+        fragments = image.data if isinstance(image.data, list) else None
+        if fragments is None:
+            image.data = image.data[:, :, self.channel, np.newaxis]
+        else:
+            image.data = [part[:, :, self.channel, np.newaxis] for part in fragments]
+
+        return image
diff --git a/tools/accuracy_checker/accuracy_checker/preprocessor/geometric_transformations.py b/tools/accuracy_checker/accuracy_checker/preprocessor/geometric_transformations.py
index ee117594239..7a1dc33772a 100644
--- a/tools/accuracy_checker/accuracy_checker/preprocessor/geometric_transformations.py
+++ b/tools/accuracy_checker/accuracy_checker/preprocessor/geometric_transformations.py
@@ -19,351 +19,19 @@
 
 import cv2
 import numpy as np
-from PIL import Image
 
 from ..config import ConfigError, NumberField, StringField, BoolField
-from ..dependency import ClassProvider
-from ..logging import warning
 from ..preprocessor import Preprocessor
-from ..utils import contains_all, get_size_from_config, string_to_tuple, get_size_3d_from_config
+from ..utils import get_size_from_config, string_to_tuple, get_size_3d_from_config
 
+try:
+    from PIL import Image
+except ImportError:
+    Image = None
 
 # The field .type should be string, the field .parameters should be dict
 GeometricOperationMetadata = namedtuple('GeometricOperationMetadata', ['type', 'parameters'])
 
-
-def scale_width(dst_width, dst_height, image_width, image_height,):
-    return int(dst_width * image_width / image_height), dst_height
-
-
-def scale_height(dst_width, dst_height, image_width, image_height):
-    return dst_width, int(dst_height * image_height / image_width)
-
-
-def scale_greater(dst_width, dst_height, image_width, image_height):
-    if image_height > image_width:
-        return scale_height(dst_width, dst_height, image_width, image_height)
-    return scale_width(dst_width, dst_height, image_width, image_height)
-
-
-def scale_fit_to_window(dst_width, dst_height, image_width, image_height):
-    im_scale = min(dst_height / image_height, dst_width / image_width)
-    return int(im_scale * image_width), int(im_scale * image_height)
-
-
-def frcnn_keep_aspect_ratio(dst_width, dst_height, image_width, image_height):
-    min_size = min(dst_width, dst_height)
-    max_size = max(dst_width, dst_height)
-    w1, h1 = scale_greater(min_size, min_size, image_width, image_height)
-    if max(w1, h1) <= max_size:
-        return w1, h1
-
-    return scale_fit_to_window(max_size, max_size, image_width, image_height)
-
-
-def ctpn_keep_aspect_ratio(dst_width, dst_height, image_width, image_height):
-    scale = min(dst_height, dst_width)
-    max_scale = max(dst_height, dst_width)
-    im_min_size = min(image_width, image_height)
-    im_max_size = max(image_width, image_height)
-    im_scale = float(scale) / float(im_min_size)
-    if np.round(im_scale * im_max_size) > max_scale:
-        im_scale = float(max_scale) / float(im_max_size)
-    new_h = np.round(image_height * im_scale)
-    new_w = np.round(image_width * im_scale)
-    return int(new_w), int(new_h)
-
-
-def east_keep_aspect_ratio(dst_width, dst_height, image_width, image_height):
-    resize_w = image_width
-    resize_h = image_height
-    max_side_len = max(dst_width, dst_height)
-    min_side_len = min(dst_width, dst_height)
-
-    # limit the max side
-    if max(resize_h, resize_w) > max_side_len:
-        ratio = float(max_side_len) / resize_h if resize_h > resize_w else float(max_side_len) / resize_w
-    else:
-        ratio = 1.
-    resize_h = int(resize_h * ratio)
-    resize_w = int(resize_w * ratio)
-
-    resize_h = resize_h if resize_h % min_side_len == 0 else (resize_h // min_side_len - 1) * min_side_len
-    resize_w = resize_w if resize_w % min_side_len == 0 else (resize_w // min_side_len - 1) * min_side_len
-    resize_h = max(32, resize_h)
-    resize_w = max(32, resize_w)
-
-    return resize_w, resize_h
-
-
-ASPECT_RATIO_SCALE = {
-    'width': scale_width,
-    'height': scale_height,
-    'greater': scale_greater,
-    'fit_to_window': scale_fit_to_window,
-    'frcnn_keep_aspect_ratio': frcnn_keep_aspect_ratio,
-    'ctpn_keep_aspect_ratio': ctpn_keep_aspect_ratio,
-    'east_keep_aspect_ratio': east_keep_aspect_ratio
-}
-
-
-class _Resizer(ClassProvider):
-    __provider_type__ = 'resizer'
-
-    supported_interpolations = {}
-    default_interpolation = None
-
-    def __init__(self, interpolation=None):
-        if not interpolation:
-            interpolation = self.default_interpolation
-        if interpolation.upper() not in self.supported_interpolations:
-            raise ConfigError('{} not found for {}'.format(self.supported_interpolations, self.__provider__))
-        self.interpolation = self.supported_interpolations.get(interpolation.upper(), self.default_interpolation)
-
-    def resize(self, data, new_height, new_width):
-        raise NotImplementedError
-
-    def __call__(self, data, new_height, new_width):
-        return self.resize(data, new_height, new_width)
-
-    @classmethod
-    def all_provided_interpolations(cls):
-        interpolations = set()
-        for _, provider_class in cls.providers.items():
-            try:
-                interpolations.update(provider_class.supported_interpolations)
-            except ImportError:
-                continue
-        return interpolations
-
-
-class _OpenCVResizer(_Resizer):
-    __provider__ = 'opencv'
-
-    supported_interpolations = {
-        'NEAREST': cv2.INTER_NEAREST,
-        'LINEAR': cv2.INTER_LINEAR,
-        'CUBIC': cv2.INTER_CUBIC,
-        'AREA': cv2.INTER_AREA,
-        'MAX': cv2.INTER_MAX,
-        'BITS': cv2.INTER_BITS,
-        'BITS2': cv2.INTER_BITS2,
-        'LANCZOS4': cv2.INTER_LANCZOS4,
-    }
-    default_interpolation = 'LINEAR'
-
-    def resize(self, data, new_height, new_width):
-        return cv2.resize(data, (new_width, new_height), interpolation=self.interpolation).astype(np.float32)
-
-
-class _PillowResizer(_Resizer):
-    __provider__ = 'pillow'
-
-    supported_interpolations = {
-        'NEAREST': Image.NEAREST,
-        'NONE': Image.NONE,
-        'BOX': Image.BOX,
-        'BILINEAR': Image.BILINEAR,
-        'LINEAR': Image.LINEAR,
-        'HAMMING': Image.HAMMING,
-        'BICUBIC': Image.BICUBIC,
-        'CUBIC': Image.CUBIC,
-        'LANCZOS': Image.LANCZOS,
-        'ANTIALIAS': Image.ANTIALIAS
-    }
-    default_interpolation = 'BILINEAR'
-
-    def resize(self, data, new_height, new_width):
-        data = Image.fromarray(data)
-        data = data.resize((new_width, new_height), self.interpolation)
-        data = np.array(data)
-
-        return data
-
-
-class _TFResizer(_Resizer):
-    __provider__ = 'tf'
-
-    def __init__(self, interpolation):
-        try:
-            import tensorflow as tf
-        except ImportError as import_error:
-            raise ImportError(
-                'tf resize disabled. Please, install Tensorflow before using. \n{}'.format(import_error.msg)
-            )
-        tf.enable_eager_execution()
-        self.supported_interpolations = {
-            'BILINEAR': tf.image.ResizeMethod.BILINEAR,
-            'AREA': tf.image.ResizeMethod.AREA,
-            'BICUBIC': tf.image.ResizeMethod.BICUBIC,
-        }
-        self.default_interpolation = 'BILINEAR'
-        self._resize = tf.image.resize_images
-
-        super().__init__(interpolation)
-
-    def resize(self, data, new_height, new_width):
-        resized_data = self._resize(data, [new_height, new_width], method=self.interpolation)
-        return resized_data.numpy()
-
-
-def create_resizer(config):
-    resize_realization = config.get('resize_realization')
-    interpolation = config.get('interpolation')
-
-    def provided_both_resizer(additional_flag):
-        return contains_all(config, ['resize_realization', additional_flag])
-
-    def select_resizer_by_flags(use_pil, use_tf):
-        if use_pil and use_tf:
-            raise ConfigError('Pillow and TensorFlow flags both provided. Please select only one resize method.')
-        if use_pil:
-            return 'pillow'
-        if use_tf:
-            return 'tf'
-        return 'opencv'
-
-    if resize_realization:
-        if provided_both_resizer('use_pillow') or provided_both_resizer('use_tensorflow'):
-            warning(
-                'resize_realization and flag: {} both provided. resize_realization: {} will be used.'.format(
-                    'use_pillow' if 'use_pillow' in config else 'use_tensorflow', config['resize_realization']
-                )
-            )
-    else:
-        use_pillow, use_tesorfow = config.get('use_pillow', False), config.get('use_tensorflow', False)
-        resize_realization = select_resizer_by_flags(use_pillow, use_tesorfow)
-
-    return _Resizer.provide(resize_realization, interpolation)
-
-
-class Resize(Preprocessor):
-    __provider__ = 'resize'
-
-    @classmethod
-    def parameters(cls):
-        parameters = super().parameters()
-        parameters.update({
-            'size': NumberField(
-                value_type=int, optional=True, min_value=1, description="Destination sizes for both dimensions."
-            ),
-            'dst_width': NumberField(
-                value_type=int, optional=True, min_value=1, description="Destination width for image resizing."
-            ),
-            'dst_height': NumberField(
-                value_type=int, optional=True, min_value=1, description="Destination height for image resizing."
-            ),
-            'aspect_ratio_scale': StringField(
-                choices=ASPECT_RATIO_SCALE, optional=True,
-                description="Allows save image aspect ratio using one of these ways: "
-                            "{}".format(', '.join(ASPECT_RATIO_SCALE))
-            ),
-            'interpolation': StringField(
-                choices=_Resizer.all_provided_interpolations(), optional=True, default='LINEAR',
-                description="Specifies method that will be used."
-            ),
-            'use_pillow': BoolField(
-                optional=True, default=False,
-                description="Parameter specifies usage of Pillow library for resizing."
-            ),
-            'use_tensorflow': BoolField(
-                optional=True,
-                description="Specifies usage of TensorFlow Image for resizing. Requires TensorFlow installation."
-            ),
-            'resize_realization': StringField(
-                optional=True, choices=_Resizer.providers,
-                description="Parameter specifies functionality of which library will be used for resize: "
-                            "{}".format(', '.join(_Resizer.providers))
-            )
-        })
-
-        return parameters
-
-    def configure(self):
-        self.dst_height, self.dst_width = get_size_from_config(self.config)
-        self.resizer = create_resizer(self.config)
-        self.scaling_func = ASPECT_RATIO_SCALE.get(self.get_value_from_config('aspect_ratio_scale'))
-
-    def process(self, image, annotation_meta=None):
-        data = image.data
-        new_height, new_width = self.dst_height, self.dst_width
-
-        is_simple_case = not isinstance(data, list) # otherwise -- pyramid, tiling, etc
-
-        def process_data(data, new_height, new_width, scale_func, resize_func):
-            dst_width, dst_height = new_width, new_height
-            image_h, image_w = data.shape[:2]
-            if scale_func:
-                dst_width, dst_height = scale_func(new_width, new_height, image_w, image_h)
-
-            resize_meta = {}
-            resize_meta['preferable_width'] = max(dst_width, new_width)
-            resize_meta['preferable_height'] = max(dst_height, new_height)
-            resize_meta['image_info'] = [dst_height, dst_width, 1]
-            resize_meta['scale_x'] = float(dst_width) / image_w
-            resize_meta['scale_y'] = float(dst_height) / image_h
-            resize_meta['original_width'] = image_w
-            resize_meta['original_height'] = image_h
-
-            if is_simple_case:
-                # support GeometricOperationMetadata array for simple case only -- without tiling, pyramids, etc
-                image.metadata.setdefault(
-                    'geometric_operations', []).append(GeometricOperationMetadata('resize', resize_meta))
-
-            image.metadata.update(resize_meta)
-
-            data = resize_func(data, dst_height, dst_width)
-            if len(data.shape) == 2:
-                data = np.expand_dims(data, axis=-1)
-
-            return data
-
-        image.data = (
-            process_data(data, new_height, new_width, self.scaling_func, self.resizer)
-            if is_simple_case else [
-                process_data(data_fragment, new_height, new_width, self.scaling_func, self.resizer)
-                for data_fragment in data
-            ]
-        )
-
-        return image
-
-
-class AutoResize(Preprocessor):
-    __provider__ = 'auto_resize'
-
-    def configure(self):
-        if self.input_shapes is None or len(self.input_shapes) != 1:
-            raise ConfigError('resize to input size possible, only for one input layer case')
-        input_shape = next(iter(self.input_shapes.values()))
-        self.dst_height, self.dst_width = input_shape[2:]
-
-    def process(self, image, annotation_meta=None):
-        is_simple_case = not isinstance(image.data, list) # otherwise -- pyramid, tiling, etc
-
-        def process_data(data):
-            data = cv2.resize(data, (self.dst_width, self.dst_height)).astype(np.float32)
-            if len(data.shape) == 2:
-                data = np.expand_dims(data, axis=-1)
-
-            if is_simple_case:
-                # support GeometricOperationMetadata array for simple case only -- without tiling, pyramids, etc
-                image.metadata.setdefault('geometric_operations', []).append(
-                    GeometricOperationMetadata('auto_resize', {})
-                )
-
-            return data
-
-        data = image.data
-        image.data = (
-            process_data(data) if is_simple_case else [
-                process_data(data_fragment)for data_fragment in data
-            ]
-        )
-
-        return image
-
-
 FLIP_MODES = {'horizontal': 0, 'vertical': 1}
 
 
@@ -374,8 +42,10 @@ class Flip(Preprocessor):
     def parameters(cls):
         parameters = super().parameters()
         parameters.update({
-            'mode' : StringField(choices=FLIP_MODES.keys(), default='horizontal',
-                                 description="Specifies the axis for flipping (vertical or horizontal).")
+            'mode': StringField(
+                choices=FLIP_MODES.keys(), default='horizontal',
+                description="Specifies the axis for flipping (vertical or horizontal)."
+            )
         })
         return parameters
 
@@ -422,6 +92,10 @@ def parameters(cls):
 
     def configure(self):
         self.use_pillow = self.get_value_from_config('use_pillow')
+        if self.use_pillow and Image is None:
+            raise ValueError(
+                'Crop operation with pillow backend, requires Pillow. Please install it or select default backend'
+            )
         self.dst_height, self.dst_width = get_size_from_config(self.config, allow_none=True)
         self.central_fraction = self.get_value_from_config('central_fraction')
         if self.dst_height is None and self.dst_width is None and self.central_fraction is None:
@@ -637,11 +311,11 @@ def align(self, img, points):
 
     @staticmethod
     def transformation_from_points(points1, points2):
-        points1 = np.matrix(points1.astype(np.float64))
-        points2 = np.matrix(points2.astype(np.float64))
+        points1 = points1.astype(np.float64)
+        points2 = points2.astype(np.float64)
 
-        c1 = np.mean(points1, axis=0)
-        c2 = np.mean(points2, axis=0)
+        c1 = np.mean(points1, axis=0, keepdims=True)
+        c2 = np.mean(points2, axis=0, keepdims=True)
         points1 -= c1
         points2 -= c2
         s1 = np.std(points1)
@@ -650,10 +324,10 @@ def transformation_from_points(points1, points2):
         points2 /= np.maximum(s1, np.finfo(np.float64).eps)
         points_std_ratio = s2 / np.maximum(s1, np.finfo(np.float64).eps)
 
-        u, _, vt = np.linalg.svd(points1.T * points2)
-        r = (u * vt).T
+        u, _, vt = np.linalg.svd(points1.T @ points2)
+        r = (u @ vt).T
 
-        return np.hstack((points_std_ratio * r, c2.T - points_std_ratio * r * c1.T))
+        return np.hstack((points_std_ratio * r, c2.T - points_std_ratio * r @ c1.T))
 
 
 def center_padding(dst_width, dst_height, width, height):
@@ -865,3 +539,125 @@ def crop_center(img, cropx, cropy, cropz):
         endz = min(startz + cropz, z)
 
         return img[startz:endz, starty:endy, startx:endx, :]
+
+
+class TransformedCropWithAutoScale(Preprocessor):
+    """Affine-warp the area around the first rectangle of annotation_meta['rects'] to the configured size."""
+    __provider__ = 'transformed_crop_with_auto_scale'
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'size': NumberField(
+                value_type=int, optional=True, min_value=1,
+                description="Destination sizes for both dimensions of heatmaps output."
+            ),
+            'dst_width': NumberField(
+                value_type=int, optional=True, min_value=1, description="Width of heatmaps output."
+            ),
+            'dst_height': NumberField(
+                value_type=int, optional=True, min_value=1, description="Height of heatmaps output."
+            ),
+            'stride': NumberField(
+                value_type=int, optional=False,
+                description="Stride for network. It is input size of heatmaps / output size of heatmaps."
+            )
+        })
+
+        return parameters
+
+    def configure(self):
+        self.input_height, self.input_width = get_size_from_config(self.config)
+        self.stride = self.get_value_from_config('stride')
+
+    def process(self, image, annotation_meta=None):
+        """Warp image.data; metadata['rev_trans'] maps (input size // stride) coordinates back to the source."""
+        data = image.data
+        center, scale = self.get_center_scale(annotation_meta['rects'][0], data.shape[1], data.shape[0])
+        trans = self.get_transformation_matrix(center, scale, [self.input_width, self.input_height])
+        rev_trans = self.get_transformation_matrix(center, scale, [self.input_width // self.stride,
+                                                                   self.input_height // self.stride], key=1)
+        image.data = cv2.warpAffine(data, trans, (self.input_width, self.input_height), flags=cv2.INTER_LINEAR)
+        image.metadata.setdefault('rev_trans', rev_trans)
+        return image
+
+    @staticmethod
+    def get_center_scale(bbox, image_w, image_h):
+        """Return (center, scale) for an [x, y, w, h] box clipped to the image; the input box is not modified."""
+        aspect_ratio = 0.75
+        # build a new list instead of assigning into bbox, which belongs to the caller's annotation
+        bbox = [np.max((0, bbox[0])), np.max((0, bbox[1])), bbox[2], bbox[3]]
+        x2 = np.min((image_w - 1, bbox[0] + np.max((0, bbox[2] - 1))))
+        y2 = np.min((image_h - 1, bbox[1] + np.max((0, bbox[3] - 1))))
+        if x2 >= bbox[0] and y2 >= bbox[1]:
+            bbox = [bbox[0], bbox[1], x2 - bbox[0], y2 - bbox[1]]
+        cx_bbox = bbox[0] + bbox[2] * 0.5
+        cy_bbox = bbox[1] + bbox[3] * 0.5
+        center = np.array([np.float32(cx_bbox), np.float32(cy_bbox)])
+        if bbox[2] > aspect_ratio * bbox[3]:
+            bbox[3] = bbox[2] * 1.0 / aspect_ratio
+        elif bbox[2] < aspect_ratio * bbox[3]:
+            bbox[2] = bbox[3] * aspect_ratio
+        scale = np.array([bbox[2] / 200., bbox[3] / 200.], np.float32) * 1.25
+        return center, scale
+
+    @staticmethod
+    def get_transformation_matrix(center, scale, output_size, key=0):
+        """Build the affine matrix source -> output_size (key == 0) or the opposite direction (any other key)."""
+        w, _ = scale * 200
+        shift_y = [0, -w * 0.5]
+        shift_x = [-w * 0.5, 0]
+        points = np.array([center, center + shift_x, center + shift_y], dtype=np.float32)
+        transformed_points = np.array([
+            [output_size[0] * 0.5, output_size[1] * 0.5],
+            [0, output_size[1] * 0.5],
+            [output_size[0] * 0.5, output_size[1] * 0.5 - output_size[0] * 0.5]], dtype=np.float32)
+        if key == 0:
+            trans = cv2.getAffineTransform(np.float32(points), np.float32(transformed_points))
+        else:
+            trans = cv2.getAffineTransform(np.float32(transformed_points), np.float32(points))
+        return trans
+
+
+class ImagePyramid(Preprocessor):
+    """Replace image.data with a list of progressively rescaled copies and flag the sample as multi-infer."""
+    __provider__ = 'pyramid'
+
+    @classmethod
+    def parameters(cls):
+        parameters = super().parameters()
+        parameters.update({
+            'min_size': NumberField(value_type=int, min_value=1, description='min side size for pyramid layer'),
+            'factor': NumberField(value_type=float, description='scale factor for pyramid layers')
+        })
+
+        return parameters
+
+    def configure(self):
+        self.min_size = self.get_value_from_config('min_size')
+        self.factor = self.get_value_from_config('factor')
+        if self.factor >= 1:
+            # every layer multiplies the remaining size by factor, so the loop in process would never end
+            raise ConfigError('pyramid factor should be less than 1, got {}'.format(self.factor))
+
+    def process(self, image, annotation_meta=None):
+        data = image.data.astype(float)
+        height, width, _ = data.shape
+        m = 12.0 / self.min_size
+        min_layer = min(height, width) * m
+        scales = []
+        factor_count = 0
+        while min_layer >= 12:  # stop once the scaled shorter side drops below 12
+            scales.append(m * pow(self.factor, factor_count))
+            min_layer *= self.factor
+            factor_count += 1
+        scaled_data = []
+        for scale in scales:
+            hs = int(np.ceil(height * scale))
+            ws = int(np.ceil(width * scale))
+            scaled_data.append(cv2.resize(data, (ws, hs)))
+
+        image.data = scaled_data
+        image.metadata.update({'multi_infer': True, 'scales': scales})
+        return image
diff --git a/tools/accuracy_checker/accuracy_checker/preprocessor/preprocessing_executor.py b/tools/accuracy_checker/accuracy_checker/preprocessor/preprocessing_executor.py
index 96c7557c98b..7060d4374a2 100644
--- a/tools/accuracy_checker/accuracy_checker/preprocessor/preprocessing_executor.py
+++ b/tools/accuracy_checker/accuracy_checker/preprocessor/preprocessing_executor.py
@@ -15,14 +15,14 @@
 """
 
 from ..config import ConfigValidator, StringField
-from .preprocessor import Preprocessor
+from .preprocessor import Preprocessor, MULTI_INFER_PREPROCESSORS
 
 
 class PreprocessingExecutor:
     def __init__(self, processors=None, dataset_name='custom', dataset_meta=None, input_shapes=None):
         self.processors = []
         self.dataset_meta = dataset_meta
-        self.input_shapes = input_shapes
+        self._multi_infer_transformations = False
 
         if not processors:
             return
@@ -36,11 +36,16 @@ def __init__(self, processors=None, dataset_name='custom', dataset_meta=None, in
             type_ = processor.get(identifier)
             preprocessor_config.validate(processor, type_)
             preprocessor = Preprocessor.provide(
-                processor[identifier], config=processor, name=type_, input_shapes=input_shapes
+                processor[identifier], config=processor, name=type_
             )
+            if processor[identifier] in MULTI_INFER_PREPROCESSORS:
+                self._multi_infer_transformations = True
 
             self.processors.append(preprocessor)
 
+        if input_shapes is not None:
+            self.input_shapes = input_shapes
+
     def __call__(self, context, *args, **kwargs):
         batch_data = context.data_batch
         batch_annotation = context.annotation_batch
@@ -55,6 +60,20 @@ def process(self, images, batch_annotation=None):
 
         return images
 
+    @property
+    def has_multi_infer_transformations(self):  # True if any configured type is in MULTI_INFER_PREPROCESSORS
+        return self._multi_infer_transformations
+
+    @property
+    def input_shapes(self):
+        return getattr(self, '_input_shapes', None)  # unset when __init__ received no shapes or returned early
+
+    @input_shapes.setter
+    def input_shapes(self, input_shapes):
+        self._input_shapes = input_shapes
+        for preprocessor in self.processors:
+            preprocessor.set_input_shape(input_shapes)
+
 
 class PreprocessorConfig(ConfigValidator):
     type = StringField(choices=Preprocessor.providers)
diff --git a/tools/accuracy_checker/accuracy_checker/preprocessor/preprocessor.py b/tools/accuracy_checker/accuracy_checker/preprocessor/preprocessor.py
index 577a61ce338..7a5196f2625 100644
--- a/tools/accuracy_checker/accuracy_checker/preprocessor/preprocessor.py
+++ b/tools/accuracy_checker/accuracy_checker/preprocessor/preprocessor.py
@@ -19,13 +19,16 @@
 from ..utils import get_parameter_value_from_config
 
 
+MULTI_INFER_PREPROCESSORS = ['tiling', 'normalize3d', 'image_pyramid', 'pyramid']  # 'pyramid': ImagePyramid provider
+
+
 class Preprocessor(ClassProvider):
     __provider_type__ = 'preprocessor'
 
-    def __init__(self, config, name=None, input_shapes=None):
+    def __init__(self, config, name=None):
         self.config = config
         self.name = name
-        self.input_shapes = input_shapes
+        self.input_shapes = None  # shapes are not passed at construction; the executor calls set_input_shape()
 
         self.validate_config()
         self.configure()
@@ -54,3 +57,6 @@ def validate_config(self):
         ConfigValidator(
             self.name, on_extra_argument=ConfigValidator.ERROR_ON_EXTRA_ARGUMENT, fields=self.parameters()
         ).validate(self.config)
+
+    def set_input_shape(self, input_shape):  # no-op by default; called by PreprocessingExecutor.input_shapes setter
+        pass
diff --git a/tools/accuracy_checker/accuracy_checker/preprocessor/resize.py b/tools/accuracy_checker/accuracy_checker/preprocessor/resize.py
new file mode 100644
index 00000000000..c17d23365a9
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/preprocessor/resize.py
@@ -0,0 +1,402 @@
+import cv2
+import numpy as np
+
+from ..config import ConfigError, NumberField, StringField, BoolField
+from ..dependency import ClassProvider
+from ..logging import warning
+from ..preprocessor import Preprocessor, GeometricOperationMetadata
+from ..utils import contains_all, get_size_from_config
+
+try:
+    from PIL import Image
+except ImportError:
+    Image = None
+
+try:
+    import tensorflow as tf
+except ImportError:
+    tf = None
+
+def scale_width(dst_width, dst_height, image_width, image_height):
+    return int(image_width * dst_width / image_height), dst_height  # width scaled by image w/h ratio
+
+
+def scale_height(dst_width, dst_height, image_width, image_height):
+    return dst_width, int(image_height * dst_height / image_width)  # height scaled by image h/w ratio
+
+
+def scale_greater(dst_width, dst_height, image_width, image_height):
+    # images taller than wide go through scale_height, everything else through scale_width
+    scaler = scale_height if image_height > image_width else scale_width
+    return scaler(dst_width, dst_height, image_width, image_height)
+
+
+def scale_fit_to_window(dst_width, dst_height, image_width, image_height):
+    ratio = min(dst_height / image_height, dst_width / image_width)  # the tighter of the two fits
+    return int(ratio * image_width), int(ratio * image_height)
+
+
+def frcnn_keep_aspect_ratio(dst_width, dst_height, image_width, image_height):
+    # first candidate: scale_greater with the smaller destination side used for both dimensions
+    short_side, long_side = sorted((dst_width, dst_height))
+    candidate = scale_greater(short_side, short_side, image_width, image_height)
+    if max(candidate) > long_side:
+        # candidate exceeds the larger destination side: fit into a long_side square instead
+        candidate = scale_fit_to_window(long_side, long_side, image_width, image_height)
+    return candidate
+
+
+def ctpn_keep_aspect_ratio(dst_width, dst_height, image_width, image_height):
+    # the shorter image side is scaled to the smaller destination side, unless that would push
+    # the longer image side past the larger destination side
+    target_short, target_long = min(dst_height, dst_width), max(dst_height, dst_width)
+    image_short, image_long = min(image_width, image_height), max(image_width, image_height)
+    factor = float(target_short) / float(image_short)
+    if np.round(factor * image_long) > target_long:
+        factor = float(target_long) / float(image_long)
+    resized_width = int(np.round(image_width * factor))
+    resized_height = int(np.round(image_height * factor))
+    return resized_width, resized_height
+
+
+def east_keep_aspect_ratio(dst_width, dst_height, image_width, image_height):
+    """Cap the longer image side, then align both sides to a stride.
+
+    The larger destination side is the cap, the smaller one is the stride.
+    Returns (width, height); neither is ever smaller than 32.
+    """
+    longest_allowed = max(dst_width, dst_height)
+    stride = min(dst_width, dst_height)
+    longest_side = max(image_height, image_width)
+
+    # shrink only when the image exceeds the cap; never upscale
+    ratio = float(longest_allowed) / longest_side if longest_side > longest_allowed else 1.
+
+    def snap(side):
+        side = int(side * ratio)
+        # a side that is not a stride multiple drops one multiple below its floor
+        aligned = side if side % stride == 0 else (side // stride - 1) * stride
+        return max(32, aligned)
+
+    return snap(image_width), snap(image_height)
+
+
+ASPECT_RATIO_SCALE = {  # 'aspect_ratio_scale' config value -> function returning (width, height)
+    'width': scale_width,
+    'height': scale_height,
+    'greater': scale_greater,
+    'fit_to_window': scale_fit_to_window,
+    'frcnn_keep_aspect_ratio': frcnn_keep_aspect_ratio,
+    'ctpn_keep_aspect_ratio': ctpn_keep_aspect_ratio,
+    'east_keep_aspect_ratio': east_keep_aspect_ratio
+}
+
+
+class _Resizer(ClassProvider):
+    """Base resize backend: resolves an interpolation name to a backend constant, then resizes."""
+    __provider_type__ = 'resizer'
+    default_interpolation = None
+
+    def __init__(self, interpolation=None):
+        requested = interpolation or self.default_interpolation  # falsy -> backend default
+        supported = self.supported_interpolations()
+        if requested is None or requested.upper() not in supported:  # names are case-insensitive
+            raise ConfigError('{} not found for {}'.format(requested, self.__provider__))
+        self.interpolation = supported[requested.upper()]
+
+    def resize(self, data, new_height, new_width):
+        raise NotImplementedError
+
+    def __call__(self, data, new_height, new_width):
+        return self.resize(data, new_height, new_width)
+
+    @classmethod
+    def all_provided_interpolations(cls):  # union of the names accepted by any registered backend
+        interpolations = set()
+        for provider_class in cls.providers.values():
+            try:
+                interpolations.update(provider_class.supported_interpolations())
+            except ImportError:  # a backend whose library is missing contributes nothing
+                continue
+        return interpolations
+
+    @classmethod
+    def supported_interpolations(cls):
+        return {}
+
+
+class _OpenCVResizer(_Resizer):
+    __provider__ = 'opencv'
+
+    _supported_interpolations = {  # interpolation name -> cv2 constant
+        'NEAREST': cv2.INTER_NEAREST,
+        'LINEAR': cv2.INTER_LINEAR,
+        'CUBIC': cv2.INTER_CUBIC,
+        'AREA': cv2.INTER_AREA,
+        'MAX': cv2.INTER_MAX,
+        'BITS': cv2.INTER_BITS,
+        'BITS2': cv2.INTER_BITS2,
+        'LANCZOS4': cv2.INTER_LANCZOS4,
+    }
+    default_interpolation = 'LINEAR'
+
+    def resize(self, data, new_height, new_width):  # cv2.resize takes (width, height); output is float32
+        return cv2.resize(data, (new_width, new_height), interpolation=self.interpolation).astype(np.float32)
+
+    @classmethod
+    def supported_interpolations(cls):
+        return cls._supported_interpolations
+
+
+class _PillowResizer(_Resizer):
+    """Resize backend built on PIL.Image.resize.
+
+    Interpolation names are resolved through supported_interpolations().
+    """
+
+    __provider__ = 'pillow'
+    default_interpolation = 'BILINEAR'
+
+    def __init__(self, interpolation):
+        """Resolve the interpolation name against the Pillow filter table.
+
+        Raises ImportError when PIL could not be imported; an unsupported name is
+        rejected by the base class initializer.
+        """
+        if Image is None:
+            raise ImportError(
+                'pillow backend for resize operation requires Pillow. Please install it before usage.'
+            )
+        # the instance table is the class-level one, so both always agree
+        self._supported_interpolations = self.supported_interpolations()
+        super().__init__(interpolation)
+
+    def resize(self, data, new_height, new_width):
+        """Resize an array through PIL and hand it back as a numpy array."""
+        data = Image.fromarray(data)
+        # PIL takes the target size as (width, height)
+        data = data.resize((new_width, new_height), self.interpolation)
+        data = np.array(data)
+
+        return data
+
+    @classmethod
+    def supported_interpolations(cls):
+        """Return the interpolation name -> PIL filter mapping (empty without Pillow)."""
+        if Image is None:
+            return {}
+        # filters that are looked up unconditionally
+        intrp = {
+            'NEAREST': Image.NEAREST,
+            'NONE': Image.NONE,
+            'BILINEAR': Image.BILINEAR,
+            'LINEAR': Image.LINEAR,
+            'BICUBIC': Image.BICUBIC,
+            'CUBIC': Image.CUBIC,
+            'ANTIALIAS': Image.ANTIALIAS
+        }
+        # filters whose absence (AttributeError) is tolerated
+        try:
+            optional_interpolations = {
+                'BOX': Image.BOX,
+                'LANCZOS': Image.LANCZOS,
+                'HAMMING': Image.HAMMING,
+            }
+            intrp.update(optional_interpolations)
+        except AttributeError:
+            # one of the optional filters is missing: none of them is offered
+            pass
+        return intrp
+
+
+class _TFResizer(_Resizer):
+    """Resize backend built on tf.image.resize_images, executed eagerly."""
+    __provider__ = 'tf'
+    default_interpolation = 'BILINEAR'
+
+    def __init__(self, interpolation):
+        if tf is None:
+            raise ImportError('tf backend for resize operation requires TensorFlow. Please install it before usage.')
+        tf.enable_eager_execution()  # resize() reads the result back with .numpy()
+        self._supported_interpolations = self.supported_interpolations()
+        self._resize = tf.image.resize_images
+        super().__init__(interpolation)
+
+    def resize(self, data, new_height, new_width):
+        resized_data = self._resize(data, [new_height, new_width], method=self.interpolation)
+        return resized_data.numpy()
+
+    @classmethod
+    def supported_interpolations(cls):
+        # built on demand: the base initializer validates names against this classmethod
+        if tf is None:
+            return {}
+        return {
+            'BILINEAR': tf.image.ResizeMethod.BILINEAR,
+            'AREA': tf.image.ResizeMethod.AREA,
+            'BICUBIC': tf.image.ResizeMethod.BICUBIC,
+        }
+
+
+def create_resizer(config):
+    """Build the resize backend requested by the preprocessor config.
+
+    'resize_realization' names the backend directly. Without it the boolean
+    'use_pillow' / 'use_tensorflow' flags choose one, and 'opencv' is used
+    when neither flag is set.
+    """
+    interpolation = config.get('interpolation')
+    backend = config.get('resize_realization')
+    if backend:
+        # an explicit backend overrides the flags, but the conflict is reported
+        legacy_flags = ('use_pillow', 'use_tensorflow')
+        if any(contains_all(config, ['resize_realization', flag]) for flag in legacy_flags):
+            redundant_flag = 'use_pillow' if 'use_pillow' in config else 'use_tensorflow'
+            warning(
+                'resize_realization and flag: {} both provided. resize_realization: {} will be used.'.format(
+                    redundant_flag, config['resize_realization']
+                )
+            )
+    else:
+        # no explicit backend: derive it from the flags
+        via_pillow = config.get('use_pillow', False)
+        via_tensorflow = config.get('use_tensorflow', False)
+        if via_pillow and via_tensorflow:
+            raise ConfigError('Pillow and TensorFlow flags both provided. Please select only one resize method.')
+        backend = 'pillow' if via_pillow else 'tf' if via_tensorflow else 'opencv'
+
+    return _Resizer.provide(backend, interpolation)
+
+
+class Resize(Preprocessor):
+    __provider__ = 'resize'
+
+    @classmethod
+    def parameters(cls):  # config fields accepted by the 'resize' preprocessor
+        parameters = super().parameters()
+        parameters.update({
+            'size': NumberField(
+                value_type=int, optional=True, min_value=1, description="Destination sizes for both dimensions."
+            ),
+            'dst_width': NumberField(
+                value_type=int, optional=True, min_value=1, description="Destination width for image resizing."
+            ),
+            'dst_height': NumberField(
+                value_type=int, optional=True, min_value=1, description="Destination height for image resizing."
+            ),
+            'aspect_ratio_scale': StringField(
+                choices=ASPECT_RATIO_SCALE, optional=True,
+                description="Allows save image aspect ratio using one of these ways: "
+                            "{}".format(', '.join(ASPECT_RATIO_SCALE))
+            ),
+            'interpolation': StringField(
+                choices=_Resizer.all_provided_interpolations(), optional=True, default='LINEAR',
+                description="Specifies method that will be used."
+            ),
+            'use_pillow': BoolField(
+                optional=True, default=False,
+                description="Parameter specifies usage of Pillow library for resizing."
+            ),
+            'use_tensorflow': BoolField(
+                optional=True,
+                description="Specifies usage of TensorFlow Image for resizing. Requires TensorFlow installation."
+            ),
+            'resize_realization': StringField(
+                optional=True, choices=_Resizer.providers,
+                description="Parameter specifies functionality of which library will be used for resize: "
+                            "{}".format(', '.join(_Resizer.providers))
+            )
+        })
+
+        return parameters
+
+    def configure(self):
+        self.dst_height, self.dst_width = get_size_from_config(self.config)
+        self.resizer = create_resizer(self.config)
+        self.scaling_func = ASPECT_RATIO_SCALE.get(self.get_value_from_config('aspect_ratio_scale'))  # may be None
+
+    def process(self, image, annotation_meta=None):
+        data = image.data
+        new_height, new_width = self.dst_height, self.dst_width
+
+        is_simple_case = not isinstance(data, list) # otherwise -- pyramid, tiling, etc
+
+        def process_data(data, new_height, new_width, scale_func, resize_func):  # resize one array, record metadata
+            dst_width, dst_height = new_width, new_height
+            image_h, image_w = data.shape[:2]
+            if scale_func:
+                dst_width, dst_height = scale_func(new_width, new_height, image_w, image_h)
+
+            resize_meta = {}
+            resize_meta['preferable_width'] = max(dst_width, new_width)
+            resize_meta['preferable_height'] = max(dst_height, new_height)
+            resize_meta['image_info'] = [dst_height, dst_width, 1]
+            resize_meta['scale_x'] = float(dst_width) / image_w
+            resize_meta['scale_y'] = float(dst_height) / image_h
+            resize_meta['original_width'] = image_w
+            resize_meta['original_height'] = image_h
+
+            if is_simple_case:
+                # support GeometricOperationMetadata array for simple case only -- without tiling, pyramids, etc
+                image.metadata.setdefault(
+                    'geometric_operations', []).append(GeometricOperationMetadata('resize', resize_meta))
+
+            image.metadata.update(resize_meta)  # for a list input the last fragment's values remain
+
+            data = resize_func(data, dst_height, dst_width)
+            if len(data.shape) == 2:
+                data = np.expand_dims(data, axis=-1)  # add a trailing axis to 2-D results
+
+            return data
+
+        image.data = (
+            process_data(data, new_height, new_width, self.scaling_func, self.resizer)
+            if is_simple_case else [
+                process_data(data_fragment, new_height, new_width, self.scaling_func, self.resizer)
+                for data_fragment in data
+            ]
+        )
+
+        return image
+
+
+class AutoResize(Preprocessor):
+    __provider__ = 'auto_resize'
+
+    def __init__(self, config, name=None):
+        super().__init__(config, name)
+        self.dst_height = None  # both sizes stay None until set_input_shape() succeeds
+        self.dst_width = None
+
+    def set_input_shape(self, input_shape):
+        if input_shape is None or len(input_shape) != 1:
+            raise ConfigError('resize to input size possible, only for one input layer case')
+        input_shape = next(iter(input_shape.values()))  # the single value of the mapping
+        self.dst_height, self.dst_width = input_shape[2:]  # assumes 4 entries ending in (height, width) -- TODO confirm
+
+    def process(self, image, annotation_meta=None):
+        is_simple_case = not isinstance(image.data, list)  # otherwise -- pyramid, tiling, etc
+        if self.dst_height is None or self.dst_width is None:
+            self.set_input_shape(self.input_shapes)  # lazy fallback; raises ConfigError when shapes are unusable
+
+        def process_data(data):
+            data = cv2.resize(data, (self.dst_width, self.dst_height)).astype(np.float32)
+            if len(data.shape) == 2:
+                data = np.expand_dims(data, axis=-1)  # add a trailing axis to 2-D results
+
+            if is_simple_case:
+                # support GeometricOperationMetadata array for simple case only -- without tiling, pyramids, etc
+                image.metadata.setdefault('geometric_operations', []).append(
+                    GeometricOperationMetadata('auto_resize', {})
+                )
+
+            return data
+
+        data = image.data
+        image.data = (
+            process_data(data) if is_simple_case else [
+                process_data(data_fragment)for data_fragment in data
+            ]
+        )
+
+        return image
diff --git a/tools/accuracy_checker/accuracy_checker/presenters.py b/tools/accuracy_checker/accuracy_checker/presenters.py
index cb964655458..5e37101187e 100644
--- a/tools/accuracy_checker/accuracy_checker/presenters.py
+++ b/tools/accuracy_checker/accuracy_checker/presenters.py
@@ -15,9 +15,9 @@
 """
 
 from collections import namedtuple
-from enum import Enum
 import numpy as np
 
+from .utils import Color, color_format
 from .dependency import ClassProvider
 from .logging import print_info
 
@@ -28,28 +28,20 @@
 )
 
 
-class Color(Enum):
-    PASSED = 0
-    FAILED = 1
-
-
-def color_format(s, color=Color.PASSED):
-    if color == Color.PASSED:
-        return "\x1b[0;32m{}\x1b[0m".format(s)
-    return "\x1b[0;31m{}\x1b[0m".format(s)
-
-
 class BasePresenter(ClassProvider):
     __provider_type__ = "presenter"
 
-    def write_result(self, evaluation_result, output_callback=None, ignore_results_formatting=False):
+    def write_result(self, evaluation_result, ignore_results_formatting=False):
+        raise NotImplementedError
+
+    def extract_result(self, evaluation_result):
         raise NotImplementedError
 
 
 class ScalarPrintPresenter(BasePresenter):
     __provider__ = "print_scalar"
 
-    def write_result(self, evaluation_result: EvaluationResult, output_callback=None, ignore_results_formatting=False):
+    def write_result(self, evaluation_result: EvaluationResult, ignore_results_formatting=False):
         value, reference, name, _, threshold, meta = evaluation_result
         value = np.mean(value)
         postfix, scale, result_format = get_result_format_parameters(meta, ignore_results_formatting)
@@ -61,11 +53,21 @@ def write_result(self, evaluation_result: EvaluationResult, output_callback=None
             value, name, threshold, difference, postfix=postfix, scale=scale, result_format=result_format
         )
 
+    def extract_result(self, evaluation_result):
+        """Return ({'name', 'value', 'type', 'ref'}, meta) for a scalar metric.
+
+        'value' is the mean of the metric value; a falsy reference becomes ''.
+        """
+        value, reference, metric_name, metric_type, _, meta = evaluation_result
+        summary = dict(name=metric_name, value=np.mean(value), type=metric_type, ref=reference or '')
+
+        return summary, meta
+
 
 class VectorPrintPresenter(BasePresenter):
     __provider__ = "print_vector"
 
-    def write_result(self, evaluation_result: EvaluationResult, output_callback=None, ignore_results_formatting=False):
+    def write_result(self, evaluation_result: EvaluationResult, ignore_results_formatting=False):
         value, reference, name, _, threshold, meta = evaluation_result
         if threshold:
             threshold = float(threshold)
@@ -109,6 +111,37 @@ def write_result(self, evaluation_result: EvaluationResult, output_callback=None
                 result_format=result_format
             )
 
+    def extract_result(self, evaluation_result):
+        """Return per-value result dicts (or a single dict) together with their meta.
+
+        A scalar or one-element value gives (dict, meta). Otherwise a list with one
+        dict per value is returned - plus a '<name>@mean' entry unless meta disables
+        'calculate_mean' - and meta is repeated once per value name.
+        """
+        value, reference, name, metric_type, _, meta = evaluation_result
+        # a true scalar has no len(), so the fallback index names must not be built from it
+        fallback_names = range(0, 1 if np.isscalar(value) else len(value))
+        value_names = ['{}@{}'.format(name, value_name) for value_name in meta.get('names', fallback_names)]
+        if np.isscalar(value) or np.size(value) == 1:
+            if not np.isscalar(value):
+                value = value[0]
+            result_dict = {
+                'name': value_names[0] if 'names' in meta else name,
+                'value': value,
+                'type': metric_type,
+                'ref': reference or ''
+            }
+            return result_dict, meta
+        if meta.get('calculate_mean', True):
+            value_names.append('{}@mean'.format(name))
+            value = np.append(value, np.mean(value))
+            meta['names'] = value_names  # NOTE: updates the caller's meta in place
+        results = [
+            {'name': value_names[idx], 'value': value_item, 'type': metric_type, 'ref': ''}
+            for idx, value_item in enumerate(value)
+        ]
+        return results, [meta for _ in value_names]
+
 
 def write_scalar_result(
         res_value, name, threshold=None, diff_with_ref=None, value_name=None,
@@ -133,14 +166,6 @@ def compare_with_ref(reference, res_value, scale):
     return abs(reference - (res_value * scale))
 
 
-class ReturnValuePresenter(BasePresenter):
-    __provider__ = "return_value"
-
-    def write_result(self, evaluation_result: EvaluationResult, output_callback=None, ignore_results_formatting=False):
-        if output_callback:
-            output_callback(evaluation_result)
-
-
 def get_result_format_parameters(meta, use_default_formatting):
     postfix = ' '
     scale = 1
diff --git a/tools/accuracy_checker/accuracy_checker/progress_reporters.py b/tools/accuracy_checker/accuracy_checker/progress_reporters.py
index c37202cc6c3..eb4029587af 100644
--- a/tools/accuracy_checker/accuracy_checker/progress_reporters.py
+++ b/tools/accuracy_checker/accuracy_checker/progress_reporters.py
@@ -15,8 +15,12 @@
 """
 
 import time
+import warnings
 
-from tqdm import tqdm
+try:
+    from tqdm import tqdm
+except ImportError:
+    tqdm = None
 
 from .dependency import ClassProvider
 from .logging import print_info
@@ -85,17 +89,33 @@ def update(self, batch_id, batch_size):
 class TQDMReporter(ProgressReporter):
     __provider__ = 'bar'
 
-    def update(self, _batch_id, batch_size):
+    def __init__(self, dataset_size=None, **kwargs):
+        super().__init__(dataset_size)
+        if tqdm is None:
+            warnings.warn('tqdm is not available, progress switched to print')
+        self.tqdm_reporter = tqdm
+        self.progress_printer = PrintProgressReporter(dataset_size, print_interval=1)
+
+    def update(self, batch_id, batch_size):
         self.current += batch_size
-        self.tqdm.update(batch_size)
+        if self.tqdm_reporter:
+            self.tqdm_reporter.update(batch_size)
+        else:
+            self.progress_printer.update(batch_id, batch_size)
 
     def finish(self, objects_processed=True):
-        self.tqdm.close()
-        super().finish(objects_processed)
+        if self.tqdm_reporter:
+            self.tqdm_reporter.close() #pylint: disable=E1120
+            super().finish(objects_processed)
+        else:
+            self.progress_printer.finish(objects_processed)
 
     def reset(self, dataset_size):
         super().reset(dataset_size)
-        self.tqdm = tqdm(
-            total=self.dataset_size, unit='frames', leave=False,
-            bar_format='{l_bar}{bar}| {n_fmt}/{total_fmt} [{elapsed}<{remaining}]'
-        )
+        if self.tqdm_reporter:
+            self.tqdm_reporter = tqdm(
+                total=self.dataset_size, unit='frames', leave=False,
+                bar_format='{l_bar}{bar}| {n_fmt}/{total_fmt} [{elapsed}<{remaining}]'
+            )
+        else:
+            self.progress_printer.reset(dataset_size)
diff --git a/tools/accuracy_checker/accuracy_checker/representation/__init__.py b/tools/accuracy_checker/accuracy_checker/representation/__init__.py
index 81caaf60dbd..c036aaaa119 100644
--- a/tools/accuracy_checker/accuracy_checker/representation/__init__.py
+++ b/tools/accuracy_checker/accuracy_checker/representation/__init__.py
@@ -60,8 +60,15 @@
 from .super_resolution_representation import SuperResolutionAnnotation, SuperResolutionPrediction
 from .text_detection_representation import TextDetectionAnnotation, TextDetectionPrediction
 from .pose_estimation_representation import PoseEstimationAnnotation, PoseEstimationPrediction
+from .pose_estimation_3d_representation import PoseEstimation3dAnnotation, PoseEstimation3dPrediction
 from .hit_ratio_representation import HitRatio, HitRatioAnnotation, HitRatioPrediction
-from .nlp_representation import MachineTranslationAnnotation, MachineTranslationPrediction
+from .nlp_representation import (
+    MachineTranslationAnnotation,
+    MachineTranslationPrediction,
+    QuestionAnsweringAnnotation,
+    QuestionAnsweringPrediction,
+    TextClassificationAnnotation
+)
 
 __all__ = [
     'BaseRepresentation',
@@ -118,11 +125,16 @@
 
     'PoseEstimationAnnotation',
     'PoseEstimationPrediction',
+    'PoseEstimation3dAnnotation',
+    'PoseEstimation3dPrediction',
 
     'HitRatio',
     'HitRatioAnnotation',
     'HitRatioPrediction',
 
     'MachineTranslationAnnotation',
-    'MachineTranslationPrediction'
+    'MachineTranslationPrediction',
+    'QuestionAnsweringAnnotation',
+    'QuestionAnsweringPrediction',
+    'TextClassificationAnnotation'
 ]
diff --git a/tools/accuracy_checker/accuracy_checker/representation/nlp_representation.py b/tools/accuracy_checker/accuracy_checker/representation/nlp_representation.py
index 448ed900d0a..5dbc7c08655 100644
--- a/tools/accuracy_checker/accuracy_checker/representation/nlp_representation.py
+++ b/tools/accuracy_checker/accuracy_checker/representation/nlp_representation.py
@@ -1,4 +1,5 @@
 from .base_representation import BaseRepresentation
+from .classification_representation import ClassificationAnnotation
 
 
 class MachineTranslationRepresentation(BaseRepresentation):
@@ -16,3 +17,39 @@ class MachineTranslationPrediction(MachineTranslationRepresentation):
     def __init__(self, identifier, translation=''):
         super().__init__(identifier)
         self.translation = translation
+
+
+class QuestionAnswering(BaseRepresentation):  # base of the question answering annotation and prediction
+    def __init__(self, identifier=''):
+        super().__init__(identifier)
+
+
+class QuestionAnsweringAnnotation(QuestionAnswering):
+    def __init__(self, identifier, unique_id, input_ids, input_mask, segment_ids, tokens, orig_answer_text=None):
+        super().__init__(identifier)
+        self.orig_answer_text = orig_answer_text if orig_answer_text is not None else ''  # None is stored as ''
+        self.unique_id = unique_id
+        self.input_ids = input_ids
+        self.input_mask = input_mask
+        self.segment_ids = segment_ids
+        self.tokens = tokens
+
+
+class QuestionAnsweringPrediction(QuestionAnswering):
+    def __init__(self, identifier, start_logits, end_logits, start_index=None, end_index=None, tokens=None):
+        super().__init__(identifier)
+
+        self.start_logits = start_logits
+        self.end_logits = end_logits
+        self.start_index = start_index if start_index is not None else []  # None -> fresh empty list
+        self.end_index = end_index if end_index is not None else []
+        self.tokens = tokens if tokens is not None else []
+
+
+class TextClassificationAnnotation(ClassificationAnnotation):
+    def __init__(self, identifier, label, input_ids, input_mask, segment_ids, tokens):
+        super().__init__(identifier, label)  # identifier and label go to ClassificationAnnotation
+        self.input_ids = input_ids
+        self.input_mask = input_mask
+        self.segment_ids = segment_ids
+        self.tokens = tokens
diff --git a/tools/accuracy_checker/accuracy_checker/representation/pose_estimation_3d_representation.py b/tools/accuracy_checker/accuracy_checker/representation/pose_estimation_3d_representation.py
new file mode 100644
index 00000000000..047d61ce24d
--- /dev/null
+++ b/tools/accuracy_checker/accuracy_checker/representation/pose_estimation_3d_representation.py
@@ -0,0 +1,58 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import numpy as np
+from .base_representation import BaseRepresentation
+from .pose_estimation_representation import PoseEstimationRepresentation
+
+
+class PoseEstimation3dRepresentation(BaseRepresentation):
+    def __init__(self, identifier='', x_values=None, y_values=None, visibility=None, labels=None,
+                 x_3d_values=None, y_3d_values=None, z_3d_values=None, fx=None):
+        super().__init__(identifier)
+        self.pose_2d = PoseEstimationRepresentation(identifier, x_values, y_values, visibility, labels)
+        # np.size(None) is 1, so None has to be tested explicitly to fall back to an empty array
+        self.x_3d_values = x_3d_values if x_3d_values is not None and np.size(x_3d_values) > 0 else np.array([])
+        self.y_3d_values = y_3d_values if y_3d_values is not None and np.size(y_3d_values) > 0 else np.array([])
+        self.z_3d_values = z_3d_values if z_3d_values is not None and np.size(z_3d_values) > 0 else np.array([])
+        self.fx = fx
+
+    @property
+    def bboxes(self):
+        if self.size == 0:
+            return []
+        pose, boxes = self.pose_2d, []
+        for box_id in range(pose.x_values.shape[0]):
+            visible = pose.visibility[box_id] > 0  # only visible keypoints bound the box
+            xs, ys = pose.x_values[box_id][visible], pose.y_values[box_id][visible]
+            boxes.append([np.min(xs), np.min(ys), np.max(xs), np.max(ys)])
+        return boxes
+
+    @property
+    def size(self):
+        return len(self.pose_2d.x_values)
+
+
+class PoseEstimation3dAnnotation(PoseEstimation3dRepresentation):
+    pass  # adds nothing to the base representation
+
+
+class PoseEstimation3dPrediction(PoseEstimation3dRepresentation):
+    def __init__(self, identifier='', x_values=None, y_values=None, visibility=None, scores=None,
+                 x_3d_values=None, y_3d_values=None, z_3d_values=None, labels=None, translations=None):
+        super().__init__(identifier, x_values, y_values, visibility, labels, x_3d_values, y_3d_values, z_3d_values)
+        self.scores = scores if scores is not None and np.size(scores) else np.array([])  # default: empty
+        self.translations = translations if translations is not None and np.size(translations) else np.array([])
diff --git a/tools/accuracy_checker/accuracy_checker/representation/pose_estimation_representation.py b/tools/accuracy_checker/accuracy_checker/representation/pose_estimation_representation.py
index 298711ad201..e1e20c5394c 100644
--- a/tools/accuracy_checker/accuracy_checker/representation/pose_estimation_representation.py
+++ b/tools/accuracy_checker/accuracy_checker/representation/pose_estimation_representation.py
@@ -23,8 +23,8 @@ def __init__(self, identifier='', x_values=None, y_values=None, visibility=None,
         super().__init__(identifier)
         self.x_values = x_values if np.size(x_values) > 0 else []
         self.y_values = y_values if np.size(y_values) > 0 else []
-        self.visibility = visibility if np.size(visibility) > 0 else [2] * len(x_values)
-        self.labels = labels if labels is not None else np.array([1]*len(x_values))
+        self.visibility = visibility if np.size(visibility) > 0 else [2] * len(self.x_values)
+        self.labels = labels if labels is not None else np.array([1]*len(self.x_values))
 
     @property
     def areas(self):
diff --git a/tools/accuracy_checker/accuracy_checker/representation/regression_representation.py b/tools/accuracy_checker/accuracy_checker/representation/regression_representation.py
index 99800d36233..48bb73f4a69 100644
--- a/tools/accuracy_checker/accuracy_checker/representation/regression_representation.py
+++ b/tools/accuracy_checker/accuracy_checker/representation/regression_representation.py
@@ -49,8 +49,8 @@ class GazeVectorPrediction(GazeVectorRepresentation):
 class FacialLandmarksRepresentation(BaseRepresentation):
     def __init__(self, identifier='', x_values=None, y_values=None):
         super().__init__(identifier)
-        self.x_values = x_values if x_values.any() else []
-        self.y_values = y_values if y_values.any() else []
+        self.x_values = x_values if x_values is not None else []
+        self.y_values = y_values if y_values is not None else []
 
 
 class FacialLandmarksAnnotation(FacialLandmarksRepresentation):
diff --git a/tools/accuracy_checker/accuracy_checker/representation/segmentation_representation.py b/tools/accuracy_checker/accuracy_checker/representation/segmentation_representation.py
index a66487b0df7..34b8336b98b 100644
--- a/tools/accuracy_checker/accuracy_checker/representation/segmentation_representation.py
+++ b/tools/accuracy_checker/accuracy_checker/representation/segmentation_representation.py
@@ -34,12 +34,14 @@ class GTMaskLoader(Enum):
     SCIPY = 2
     NIFTI = 3
     NUMPY = 4
+    NIFTI_CHANNELS_FIRST = 5
 
 LOADERS_MAPPING = {
     'opencv': GTMaskLoader.OPENCV,
     'pillow': GTMaskLoader.PILLOW,
     'scipy': GTMaskLoader.SCIPY,
-    'nifty': GTMaskLoader.NIFTI,
+    'nifti': GTMaskLoader.NIFTI,
+    'nifti_channels_first': GTMaskLoader.NIFTI_CHANNELS_FIRST,
     'numpy': GTMaskLoader.NUMPY
 }
 
@@ -54,6 +56,7 @@ class SegmentationAnnotation(SegmentationRepresentation):
         GTMaskLoader.OPENCV: 'opencv_imread',
         GTMaskLoader.SCIPY: 'scipy_imread',
         GTMaskLoader.NIFTI: 'nifti_reader',
+        GTMaskLoader.NIFTI_CHANNELS_FIRST: {'type': 'nifti_reader', 'channels_first': True},
         GTMaskLoader.NUMPY: 'numpy_reader'
     }
 
@@ -80,7 +83,12 @@ def mask(self, value):
 
     def _load_mask(self):
         if self._mask is None:
-            loader = BaseReader.provide(self.LOADERS.get(self._mask_loader), self.metadata['data_source'])
+            loader_config = self.LOADERS.get(self._mask_loader)
+            data_source = self.metadata.get('segmentation_masks_source', self.metadata['data_source'])
+            if isinstance(loader_config, str):
+                loader = BaseReader.provide(loader_config, data_source)
+            else:
+                loader = BaseReader.provide(loader_config['type'], data_source, config=loader_config)
             if self._mask_loader == GTMaskLoader.PILLOW:
                 loader.convert_to_rgb = False
             mask = loader.read(self._mask_path)
@@ -108,7 +116,9 @@ def __init__(self, identifier, path_to_mask, loader=GTMaskLoader.NIFTI, box=None
 
 
 class BrainTumorSegmentationPrediction(SegmentationPrediction):
-    pass
+    def __init__(self, identifiers, mask, label_order=(0, 1, 2, 3)):
+        super().__init__(identifiers, mask)
+        self.label_order = label_order  # NOTE(review): only stored here; its consumer is not visible in this hunk
 
 
 class CoCoInstanceSegmentationRepresentation(SegmentationRepresentation):
diff --git a/tools/accuracy_checker/accuracy_checker/representation/text_detection_representation.py b/tools/accuracy_checker/accuracy_checker/representation/text_detection_representation.py
index 4f138c81f17..23308ceaff2 100644
--- a/tools/accuracy_checker/accuracy_checker/representation/text_detection_representation.py
+++ b/tools/accuracy_checker/accuracy_checker/representation/text_detection_representation.py
@@ -20,11 +20,12 @@
 
 
 class TextDetectionRepresentation(BaseRepresentation):
-    def __init__(self, identifier='', points=None):
+    def __init__(self, identifier='', points=None, description=''):
         super().__init__(identifier)
         self.points = points if points is not None else []
         if isinstance(points, list):
             self.points = np.array(points)
+        self.description = description  # base-class attribute; TextDetectionAnnotation no longer sets it itself
 
     def remove(self, indexes):
         self.points = np.delete(self.points, indexes, axis=0)
@@ -32,6 +33,7 @@ def remove(self, indexes):
         if not difficult:
             return
         self.metadata['difficult_boxes'] = remove_difficult(difficult, indexes)
+        self.description = np.delete(self.description, indexes)  # NOTE(review): skipped on the early return above
 
     @property
     def boxes(self):
@@ -49,13 +51,7 @@ def boxes(self):
 
 
 class TextDetectionAnnotation(TextDetectionRepresentation):
-    def __init__(self, identifier='', points=None, description=''):
-        super().__init__(identifier, points)
-        self.description = description
-
-    def remove(self, indexes):
-        super().remove(indexes)
-        self.description = np.delete(self.description, indexes)
+    pass  # description handling is inherited from TextDetectionRepresentation
 
 
 class TextDetectionPrediction(TextDetectionRepresentation):
diff --git a/tools/accuracy_checker/accuracy_checker/statistics_collector/__init__.py b/tools/accuracy_checker/accuracy_checker/statistics_collector/__init__.py
deleted file mode 100644
index 160bbb83881..00000000000
--- a/tools/accuracy_checker/accuracy_checker/statistics_collector/__init__.py
+++ /dev/null
@@ -1,5 +0,0 @@
-from .statistics_collector import StatisticsCollector
-
-__all__ = [
-    'StatisticsCollector',
-]
diff --git a/tools/accuracy_checker/accuracy_checker/statistics_collector/statistics_collector.py b/tools/accuracy_checker/accuracy_checker/statistics_collector/statistics_collector.py
deleted file mode 100644
index 31519db1992..00000000000
--- a/tools/accuracy_checker/accuracy_checker/statistics_collector/statistics_collector.py
+++ /dev/null
@@ -1,48 +0,0 @@
-import numpy as np
-
-
-class Statistic:
-    def __init__(self, functor, batch_size):
-        self.iter_counter = 0
-        self.state = np.array([])
-        self.processor = functor
-        self.batch_size = batch_size
-
-    def update(self, activation):
-        an = self.processor(activation)
-        if self.iter_counter == 0:
-            self.state = an
-        else:
-            self.state = (self.state * self.iter_counter + an) / (self.iter_counter + 1)
-        self.iter_counter += 1
-
-    def update_on_batch(self, batch_a):
-        an_shape = np.shape(batch_a)
-        if an_shape[0] != self.batch_size:
-            self.update(batch_a)
-            return
-        for activation in batch_a:
-            self.update(activation)
-
-
-class StatisticsCollector:
-    def __init__(self, functors_mapping, batch=1):
-        self.statistics = {}
-        for layer_name, functors in functors_mapping.items():
-            self.statistics[layer_name] = [Statistic(functor, batch) for functor in functors]
-
-    def process_batch(self, outputs):
-        output_dict = outputs[0]
-        for layer_name, output in output_dict.items():
-            if layer_name not in self.statistics:
-                continue
-
-            for statistic in self.statistics[layer_name]:
-                statistic.update_on_batch(output)
-
-    def get_statistics(self):
-        per_layer_statistics = {}
-        for layer_name, layer_statistics in self.statistics.items():
-            per_layer_statistics[layer_name] = [statistic.state for statistic in layer_statistics]
-
-        return per_layer_statistics
diff --git a/tools/accuracy_checker/accuracy_checker/utils.py b/tools/accuracy_checker/accuracy_checker/utils.py
index e884b835f27..8308c1f7930 100644
--- a/tools/accuracy_checker/accuracy_checker/utils.py
+++ b/tools/accuracy_checker/accuracy_checker/utils.py
@@ -20,15 +20,14 @@
 import json
 import os
 import pickle
+from enum import Enum
 
 from pathlib import Path
 from typing import Union
 from warnings import warn
 from collections import MutableSet
 
-from shapely.geometry.polygon import Polygon
 import numpy as np
-import yamlloader
 import yaml
 
 try:
@@ -36,6 +35,16 @@
 except ImportError:
     import xml.etree.cElementTree as et
 
+try:
+    from shapely.geometry.polygon import Polygon
+except ImportError:
+    Polygon = None
+
+try:
+    from yamlloader.ordereddict import Loader as orddict_loader
+except ImportError:
+    orddict_loader = None
+
 
 def concat_lists(*lists):
     return list(itertools.chain(*lists))
@@ -274,6 +283,7 @@ def is_empty(string):
 def read_xml(file: Union[str, Path], *args, **kwargs):
     return et.parse(str(get_path(file)), *args, **kwargs).getroot()
 
+
 def read_json(file: Union[str, Path], *args, **kwargs):
     with get_path(file).open() as content:
         return json.load(content, *args, **kwargs)
@@ -286,7 +296,10 @@ def read_pickle(file: Union[str, Path], *args, **kwargs):
 
 def read_yaml(file: Union[str, Path], *args, **kwargs):
     with get_path(file).open() as content:
-        return yaml.load(content, *args, Loader=yamlloader.ordereddict.Loader, **kwargs)
+        loader = orddict_loader or yaml.SafeLoader  # yamlloader is optional; fall back to PyYAML's SafeLoader
+        if not orddict_loader:
+            warn('yamlloader is not installed: YAML key order is not preserved, which may matter for some configs')
+        return yaml.load(content, *args, Loader=loader, **kwargs)
 
 
 def read_csv(file: Union[str, Path], *args, **kwargs):
@@ -352,6 +365,8 @@ def to_lower_register(str_list):
 
 
 def polygon_from_points(points):
+    if Polygon is None:  # shapely is optional: Polygon is set to None when its import fails
+        raise ValueError('shapely is not installed, please install it')
     return Polygon(points)
 
 
@@ -488,3 +503,14 @@ def check_file_existence(file):
         return True
     except (FileNotFoundError, IsADirectoryError):
         return False
+
+
+class Color(Enum):
+    PASSED = 0  # color_format renders this with SGR code 32 (green)
+    FAILED = 1  # color_format renders this with SGR code 31 (red)
+
+
+def color_format(s, color=Color.PASSED):  # wrap s in ANSI SGR escapes and return the resulting string
+    if color == Color.PASSED:
+        return "\x1b[0;32m{}\x1b[0m".format(s)  # 32 = green foreground; trailing \x1b[0m resets
+    return "\x1b[0;31m{}\x1b[0m".format(s)  # 31 = red foreground for any value other than PASSED
diff --git a/tools/accuracy_checker/configs/Sphereface.yml b/tools/accuracy_checker/configs/Sphereface.yml
new file mode 100644
index 00000000000..e3f4951ef3d
--- /dev/null
+++ b/tools/accuracy_checker/configs/Sphereface.yml
@@ -0,0 +1,29 @@
+models:
+  - name: Sphereface
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/Sphereface/FP32/Sphereface.xml
+        weights: public/Sphereface/FP32/Sphereface.bin
+        adapter: reid
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/Sphereface/FP16/Sphereface.xml
+        weights: public/Sphereface/FP16/Sphereface.bin
+        adapter: reid
+
+    datasets:
+      - name: lfw
+
+        preprocessing:
+          - type: point_alignment
+            size: 400
+          - type: resize
+            dst_height: 112
+            dst_width: 96
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/action-recognition-0001-decoder.yml b/tools/accuracy_checker/configs/action-recognition-0001-decoder.yml
new file mode 100644
index 00000000000..d86c78bc542
--- /dev/null
+++ b/tools/accuracy_checker/configs/action-recognition-0001-decoder.yml
@@ -0,0 +1,60 @@
+evaluations:
+  - name: action-recognition-0001-decoder
+    module: custom_evaluators.sequential_action_recognition_evaluator.SequentialActionRecognitionEvaluator
+    module_config:
+      network_info:
+        encoder:
+          predictions: kinetics/action-recognition-0001-encoder-predictions.pickle
+
+
+        decoder:
+          model:   intel/action-recognition-0001-decoder/FP32/action-recognition-0001-decoder.xml
+          weights: intel/action-recognition-0001-decoder/FP32/action-recognition-0001-decoder.bin
+          num_processing_frames: 16
+          adapter: classification
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP32
+
+      datasets:
+        - name: kinetics-400
+
+          preprocessing:
+            - type: resize
+              size: 224
+              aspect_ratio_scale: fit_to_window
+            - type: crop
+              size: 224
+
+          metrics:
+            - type: clip_accuracy
+              presenter: print_vector
+
+  - name: action-recognition-0001-decoder
+    module: custom_evaluators.sequential_action_recognition_evaluator.SequentialActionRecognitionEvaluator
+    module_config:
+      network_info:
+        encoder:
+          predictions: kinetics/action-recognition-0001-encoder-predictions.pickle
+
+        decoder:
+          model:   intel/action-recognition-0001-decoder/FP16/action-recognition-0001-decoder.xml
+          weights: intel/action-recognition-0001-decoder/FP16/action-recognition-0001-decoder.bin
+          num_processing_frames: 16
+          adapter: classification
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP16
+
+      datasets:
+        - name: kinetics-400
+
+          metrics:
+            - type: clip_accuracy
+              presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/action-recognition-0001-encoder.yml b/tools/accuracy_checker/configs/action-recognition-0001-encoder.yml
new file mode 100644
index 00000000000..d8f84297fd9
--- /dev/null
+++ b/tools/accuracy_checker/configs/action-recognition-0001-encoder.yml
@@ -0,0 +1,69 @@
+evaluations:
+  - name: action-recognition-0001-encoder
+    module: custom_evaluators.sequential_action_recognition_evaluator.SequentialActionRecognitionEvaluator
+    module_config:
+      network_info:
+        encoder:
+          model:   intel/action-recognition-0001-encoder/FP32/action-recognition-0001-encoder.xml
+          weights: intel/action-recognition-0001-encoder/FP32/action-recognition-0001-encoder.bin
+
+
+        decoder:
+          model:   intel/action-recognition-0001-decoder/FP32/action-recognition-0001-decoder.xml
+          weights: intel/action-recognition-0001-decoder/FP32/action-recognition-0001-decoder.bin
+          num_processing_frames: 16
+          adapter: classification
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP32
+
+      datasets:
+        - name: kinetics-400
+
+          preprocessing:
+            - type: resize
+              size: 224
+              aspect_ratio_scale: fit_to_window
+            - type: crop
+              size: 224
+
+          metrics:
+            - type: clip_accuracy
+              presenter: print_vector
+
+  - name: action-recognition-0001-encoder
+    module: custom_evaluators.sequential_action_recognition_evaluator.SequentialActionRecognitionEvaluator
+    module_config:
+      network_info:
+        encoder:
+          model:   intel/action-recognition-0001-encoder/FP16/action-recognition-0001-encoder.xml
+          weights: intel/action-recognition-0001-encoder/FP16/action-recognition-0001-encoder.bin
+
+        decoder:
+          model:   intel/action-recognition-0001-decoder/FP16/action-recognition-0001-decoder.xml
+          weights: intel/action-recognition-0001-decoder/FP16/action-recognition-0001-decoder.bin
+          num_processing_frames: 16
+          adapter: classification
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP16
+
+      datasets:
+        - name: kinetics-400
+
+          preprocessing:
+            - type: resize
+              size: 224
+              aspect_ratio_scale: fit_to_window
+            - type: crop
+              size: 224
+
+          metrics:
+            - type: clip_accuracy
+              presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/age-gender-recognition-retail-0013.yml b/tools/accuracy_checker/configs/age-gender-recognition-retail-0013.yml
index 17adf00df69..2ed1fc8b2bf 100644
--- a/tools/accuracy_checker/configs/age-gender-recognition-retail-0013.yml
+++ b/tools/accuracy_checker/configs/age-gender-recognition-retail-0013.yml
@@ -22,6 +22,16 @@ models:
           gender_out: prob
           age_out: age_conv3
 
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/age-gender-recognition-retail-0013/FP32-INT8/age-gender-recognition-retail-0013.xml
+        weights: intel/age-gender-recognition-retail-0013/FP32-INT8/age-gender-recognition-retail-0013.bin
+        adapter:
+          type: age_gender
+          gender_out: prob
+          age_out: age_conv3
+
     datasets:
       - name: age_gender
 
@@ -44,3 +54,5 @@ models:
             prediction_source: age_classification
 
           - type: mae
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/alexnet.yml b/tools/accuracy_checker/configs/alexnet.yml
index 3d983869944..b8f2bfb67c8 100644
--- a/tools/accuracy_checker/configs/alexnet.yml
+++ b/tools/accuracy_checker/configs/alexnet.yml
@@ -43,6 +43,8 @@ models:
           - name: accuracy@top1
             type: accuracy
             top_k: 1
-          - name: acciracy@top5
+          - name: accuracy@top5
             type: accuracy
             top_k: 5
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/asl-recognition-0004.yml b/tools/accuracy_checker/configs/asl-recognition-0004.yml
new file mode 100644
index 00000000000..8081762bbea
--- /dev/null
+++ b/tools/accuracy_checker/configs/asl-recognition-0004.yml
@@ -0,0 +1,43 @@
+models:
+  - name: asl-recognition-0004
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/asl-recognition-0004/FP32/asl-recognition-0004.xml
+        weights: intel/asl-recognition-0004/FP32/asl-recognition-0004.bin
+        adapter: classification
+        inputs:
+          - type: INPUT
+            name: input
+            layout: NCDHW
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/asl-recognition-0004/FP16/asl-recognition-0004.xml
+        weights: intel/asl-recognition-0004/FP16/asl-recognition-0004.bin
+        adapter: classification
+        inputs:
+          - type: INPUT
+            name: input
+            layout: NCDHW
+
+    datasets:
+    - name: msasl-100
+
+      preprocessing:
+        - type: resize
+          size: 256
+          aspect_ratio_scale: greater
+        - type: crop
+          size: 224
+        - type: bgr_to_rgb
+
+      metrics:
+        - type: accuracy
+          name: rank@1
+          top_k: 1
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/brain-tumor-segmentation-0001.yml b/tools/accuracy_checker/configs/brain-tumor-segmentation-0001.yml
new file mode 100644
index 00000000000..67a8952a2c3
--- /dev/null
+++ b/tools/accuracy_checker/configs/brain-tumor-segmentation-0001.yml
@@ -0,0 +1,35 @@
+models:
+  - name: brain-tumor-segmentation-0001
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/brain-tumor-segmentation-0001/FP32/brain-tumor-segmentation-0001.xml
+        weights: public/brain-tumor-segmentation-0001/FP32/brain-tumor-segmentation-0001.bin
+        adapter:
+          type: brain_tumor_segmentation
+          make_argmax: True
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/brain-tumor-segmentation-0001/FP16/brain-tumor-segmentation-0001.xml
+        weights: public/brain-tumor-segmentation-0001/FP16/brain-tumor-segmentation-0001.bin
+        adapter:
+          type: brain_tumor_segmentation
+          make_argmax: True
+
+    datasets:
+      - name: BraTS
+
+        metrics:
+          # ground truth mean            [0.9239, 0.7114, 0.8205, 0.7271]
+          # UNCROPPED: ground truth mean [0.9266, 0.7256, 0.8205, 0.7268]
+          # ground truth median             [0.9316, 0.7714, 0.8535, 0.8456]
+          # UNCROPPED: ground truth median  [0.9339, 0.7918, 0.8603, 0.8576]
+          - type: dice_index
+            median: True
+            presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/brain-tumor-segmentation-0002.yml b/tools/accuracy_checker/configs/brain-tumor-segmentation-0002.yml
new file mode 100755
index 00000000000..f2e41a6938e
--- /dev/null
+++ b/tools/accuracy_checker/configs/brain-tumor-segmentation-0002.yml
@@ -0,0 +1,42 @@
+models:
+  - name: brain-tumor-segmentation-0002
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/brain-tumor-segmentation-0002/FP32/brain-tumor-segmentation-0002.xml
+        weights: public/brain-tumor-segmentation-0002/FP32/brain-tumor-segmentation-0002.bin
+        adapter:
+            type: brain_tumor_segmentation
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/brain-tumor-segmentation-0002/FP16/brain-tumor-segmentation-0002.xml
+        weights: public/brain-tumor-segmentation-0002/FP16/brain-tumor-segmentation-0002.bin
+        adapter:
+            type: brain_tumor_segmentation
+
+    datasets:
+      - name: BraTS_2017
+        preprocessing:
+          - type: swap_modalities
+            modality_order: [1,2,3,0]
+          - type: crop_brats
+          - type: normalize_brats
+            masked: ignore
+          - type: resize3d
+            size: (128,128,128)
+        postprocessing:
+          - type: segmentation_prediction_resample
+          - type: transform_brats_prediction
+            order: [0,1,2]
+            values: [1,2,3]
+
+        metrics:
+          - type: dice_index
+            median: True
+            presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/caffenet.yml b/tools/accuracy_checker/configs/caffenet.yml
index 6b7e9a26787..03941396dfc 100644
--- a/tools/accuracy_checker/configs/caffenet.yml
+++ b/tools/accuracy_checker/configs/caffenet.yml
@@ -38,3 +38,5 @@ models:
             size: 256
           - type: crop
             size: 227
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/colorization-v2-norebal.yml b/tools/accuracy_checker/configs/colorization-v2-norebal.yml
new file mode 100644
index 00000000000..24e783c3015
--- /dev/null
+++ b/tools/accuracy_checker/configs/colorization-v2-norebal.yml
@@ -0,0 +1,66 @@
+evaluations:
+  - name: colorization-v2-norebal
+    module: custom_evaluators.colorization_evaluator.ColorizationEvaluator
+    module_config:
+        network_info:
+          colorization_network:
+            model:   public/colorization-v2-norebal/FP32/colorization-v2-norebal.xml
+            weights: public/colorization-v2-norebal/FP32/colorization-v2-norebal.bin
+            color_coeff: public/colorization-v2-norebal/colorization-v2-norebal.npy
+
+          verification_network:
+            model:   public/vgg16/FP32/vgg16.xml
+            weights: public/vgg16/FP32/vgg16.bin
+            adapter: classification
+
+        launchers:
+          - framework: dlsdk
+            tags:
+              - FP32
+
+        datasets:
+          - name: imagenet_1000_classes
+            reader: pillow_imread
+
+            preprocessing:
+            -   type: resize
+                size: 256
+                aspect_ratio_scale: greater
+            -   type: crop
+                size: 224
+            -   type: normalization
+                std:  255
+
+  - name: colorization-v2-norebal
+    module: custom_evaluators.colorization_evaluator.ColorizationEvaluator
+    module_config:
+        network_info:
+          colorization_network:
+            model:   public/colorization-v2-norebal/FP16/colorization-v2-norebal.xml
+            weights: public/colorization-v2-norebal/FP16/colorization-v2-norebal.bin
+            color_coeff: public/colorization-v2-norebal/colorization-v2-norebal.npy
+
+          verification_network:
+            model:   public/vgg16/FP32/vgg16.xml
+            weights: public/vgg16/FP32/vgg16.bin
+            adapter: classification
+
+        launchers:
+          - framework: dlsdk
+            tags:
+              - FP16
+
+        datasets:
+          - name: imagenet_1000_classes
+            reader: pillow_imread
+
+            preprocessing:
+            -   type: resize
+                size: 256
+                aspect_ratio_scale: greater
+            -   type: crop
+                size: 224
+            -   type: normalization
+                std:  255
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/colorization-v2.yml b/tools/accuracy_checker/configs/colorization-v2.yml
new file mode 100644
index 00000000000..491b213f842
--- /dev/null
+++ b/tools/accuracy_checker/configs/colorization-v2.yml
@@ -0,0 +1,66 @@
+evaluations:
+  - name: colorization-v2
+    module: custom_evaluators.colorization_evaluator.ColorizationEvaluator
+    module_config:
+        network_info:
+          colorization_network:
+            model:   public/colorization-v2/FP32/colorization-v2.xml
+            weights: public/colorization-v2/FP32/colorization-v2.bin
+            color_coeff: public/colorization-v2/colorization-v2.npy
+
+          verification_network:
+            model:   public/vgg16/FP32/vgg16.xml
+            weights: public/vgg16/FP32/vgg16.bin
+            adapter: classification
+
+        launchers:
+          - framework: dlsdk
+            tags:
+              - FP32
+
+        datasets:
+          - name: imagenet_1000_classes
+            reader: pillow_imread
+
+            preprocessing:
+            -   type: resize
+                size: 256
+                aspect_ratio_scale: greater
+            -   type: crop
+                size: 224
+            -   type: normalization
+                std:  255
+
+  - name: colorization-v2
+    module: custom_evaluators.colorization_evaluator.ColorizationEvaluator
+    module_config:
+        network_info:
+          colorization_network:
+            model:   public/colorization-v2/FP16/colorization-v2.xml
+            weights: public/colorization-v2/FP16/colorization-v2.bin
+            color_coeff: public/colorization-v2/colorization-v2.npy
+
+          verification_network:
+            model:   public/vgg16/FP32/vgg16.xml
+            weights: public/vgg16/FP32/vgg16.bin
+            adapter: classification
+
+        launchers:
+          - framework: dlsdk
+            tags:
+              - FP16
+
+        datasets:
+          - name: imagenet_1000_classes
+            reader: pillow_imread
+
+            preprocessing:
+            -   type: resize
+                size: 256
+                aspect_ratio_scale: greater
+            -   type: crop
+                size: 224
+            -   type: normalization
+                std:  255
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/ctdet_coco_dlav0_384.yml b/tools/accuracy_checker/configs/ctdet_coco_dlav0_384.yml
new file mode 100644
index 00000000000..f89a4e71981
--- /dev/null
+++ b/tools/accuracy_checker/configs/ctdet_coco_dlav0_384.yml
@@ -0,0 +1,45 @@
+models:
+  - name: ctdet_coco_dlav0_384
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/ctdet_coco_dlav0_384/FP32/ctdet_coco_dlav0_384.xml
+        weights: public/ctdet_coco_dlav0_384/FP32/ctdet_coco_dlav0_384.bin
+        adapter:
+          type: ctdet
+          center_heatmap_out: "508"
+          width_height_out: "514"
+          regression_out: "511"
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/ctdet_coco_dlav0_384/FP16/ctdet_coco_dlav0_384.xml
+        weights: public/ctdet_coco_dlav0_384/FP16/ctdet_coco_dlav0_384.bin
+        adapter:
+          type: ctdet
+          center_heatmap_out: "508"
+          width_height_out: "514"
+          regression_out: "511"
+
+
+    datasets:
+      - name: ms_coco_detection_80_class_without_backgound
+        preprocessing:
+          - type: centernet_affine_transform
+            dst_width: 384
+            dst_height: 384
+
+        postprocessing:
+          - type: filter
+            apply_to: prediction
+            min_confidence: 0.3
+            remove_filtered: True
+
+        metrics:
+          - type: map
+            integral: 11point
+            presenter: print_scalar
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/ctdet_coco_dlav0_512.yml b/tools/accuracy_checker/configs/ctdet_coco_dlav0_512.yml
new file mode 100644
index 00000000000..c0e107cf696
--- /dev/null
+++ b/tools/accuracy_checker/configs/ctdet_coco_dlav0_512.yml
@@ -0,0 +1,45 @@
+models:
+  - name: ctdet_coco_dlav0_512
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/ctdet_coco_dlav0_512/FP32/ctdet_coco_dlav0_512.xml
+        weights: public/ctdet_coco_dlav0_512/FP32/ctdet_coco_dlav0_512.bin
+        adapter:
+          type: ctdet
+          center_heatmap_out: "508"
+          width_height_out: "514"
+          regression_out: "511"
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/ctdet_coco_dlav0_512/FP16/ctdet_coco_dlav0_512.xml
+        weights: public/ctdet_coco_dlav0_512/FP16/ctdet_coco_dlav0_512.bin
+        adapter:
+          type: ctdet
+          center_heatmap_out: "508"
+          width_height_out: "514"
+          regression_out: "511"
+
+
+    datasets:
+      - name: ms_coco_detection_80_class_without_backgound
+        preprocessing:
+          - type: centernet_affine_transform
+            dst_width: 512
+            dst_height: 512
+
+        postprocessing:
+          - type: filter
+            apply_to: prediction
+            min_confidence: 0.3
+            remove_filtered: True
+
+        metrics:
+          - type: map
+            integral: 11point
+            presenter: print_scalar
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/ctpn.yml b/tools/accuracy_checker/configs/ctpn.yml
new file mode 100644
index 00000000000..d971e832550
--- /dev/null
+++ b/tools/accuracy_checker/configs/ctpn.yml
@@ -0,0 +1,61 @@
+models:
+  - name: ctpn
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/ctpn/FP32/ctpn.xml
+        weights: public/ctpn/FP32/ctpn.bin
+        adapter:
+          type: ctpn_text_detection
+          cls_prob_out: 'Reshape_2/Transpose'
+          bbox_pred_out: 'rpn_bbox_pred/Reshape_1/Transpose'
+        allow_reshape_input: True
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/ctpn/FP16/ctpn.xml
+        weights: public/ctpn/FP16/ctpn.bin
+        adapter:
+          type: ctpn_text_detection
+          cls_prob_out: 'Reshape_2/Transpose'
+          bbox_pred_out: 'rpn_bbox_pred/Reshape_1/Transpose'
+        allow_reshape_input: True
+
+    datasets:
+      - name: ICDAR2015
+
+        preprocessing:
+          - type: resize
+            dst_width: 1200
+            dst_height: 600
+            aspect_ratio_scale: ctpn_keep_aspect_ratio
+          - type: resize
+            dst_width: 600
+            dst_height: 600
+
+        postprocessing:
+          - type: cast_to_int
+            round_policy: lower
+
+        metrics:
+          - type: focused_text_precision
+            name: precision
+            ignore_difficult: True
+            area_recall_constrain: 0.8
+            area_precision_constrain: 0.4
+
+          - type: focused_text_recall
+            name: recall
+            ignore_difficult: True
+            area_recall_constrain: 0.8
+            area_precision_constrain: 0.4
+
+          - type: focused_text_hmean
+            name: hmean
+            ignore_difficult: True
+            area_recall_constrain: 0.8
+            area_precision_constrain: 0.4
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/deeplabv3.yml b/tools/accuracy_checker/configs/deeplabv3.yml
index 095dccd89f5..d67d8f7d798 100644
--- a/tools/accuracy_checker/configs/deeplabv3.yml
+++ b/tools/accuracy_checker/configs/deeplabv3.yml
@@ -7,7 +7,6 @@ models:
         model:   public/deeplabv3/FP32/deeplabv3.xml
         weights: public/deeplabv3/FP32/deeplabv3.bin
         adapter: segmentation
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -15,7 +14,6 @@ models:
         model:   public/deeplabv3/FP16/deeplabv3.xml
         weights: public/deeplabv3/FP16/deeplabv3.bin
         adapter: segmentation
-        cpu_extensions: AUTO
 
     datasets:
       - name: VOC2012_Segmentation
@@ -31,3 +29,5 @@ models:
           - type: mean_iou
             use_argmax: false
             presenter: print_scalar
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/densenet-121-caffe2.yml b/tools/accuracy_checker/configs/densenet-121-caffe2.yml
new file mode 100644
index 00000000000..c9a56922bb6
--- /dev/null
+++ b/tools/accuracy_checker/configs/densenet-121-caffe2.yml
@@ -0,0 +1,46 @@
+models:
+
+  - name: densenet-121-caffe2
+    launchers:
+      - framework: onnx_runtime
+        model: public/densenet-121-caffe2/densenet-121.onnx
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+          - type: crop
+            size: 224
+          - type: normalization
+            mean: 103.94,116.78,123.68
+            std: 58.8235294
+
+  - name: densenet-121-caffe2
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/densenet-121-caffe2/FP32/densenet-121-caffe2.xml
+        weights: public/densenet-121-caffe2/FP32/densenet-121-caffe2.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/densenet-121-caffe2/FP16/densenet-121-caffe2.xml
+        weights: public/densenet-121-caffe2/FP16/densenet-121-caffe2.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+          - type: crop
+            size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/densenet-121-tf.yml b/tools/accuracy_checker/configs/densenet-121-tf.yml
index 6d552cb39ac..1158efb9882 100644
--- a/tools/accuracy_checker/configs/densenet-121-tf.yml
+++ b/tools/accuracy_checker/configs/densenet-121-tf.yml
@@ -22,3 +22,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/densenet-121.yml b/tools/accuracy_checker/configs/densenet-121.yml
index 583841f147e..f9a078493dd 100644
--- a/tools/accuracy_checker/configs/densenet-121.yml
+++ b/tools/accuracy_checker/configs/densenet-121.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/densenet-161-tf.yml b/tools/accuracy_checker/configs/densenet-161-tf.yml
index 3d643ce6f39..6ff1ef86467 100644
--- a/tools/accuracy_checker/configs/densenet-161-tf.yml
+++ b/tools/accuracy_checker/configs/densenet-161-tf.yml
@@ -22,3 +22,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/densenet-161.yml b/tools/accuracy_checker/configs/densenet-161.yml
index 74ec8962d4d..95cf48ee126 100644
--- a/tools/accuracy_checker/configs/densenet-161.yml
+++ b/tools/accuracy_checker/configs/densenet-161.yml
@@ -5,6 +5,7 @@ models:
         model:   public/densenet-161/densenet-161.prototxt
         weights: public/densenet-161/densenet-161.caffemodel
         adapter: classification
+
     datasets:
       - name: imagenet_1000_classes
         preprocessing:
@@ -39,3 +40,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/densenet-169-tf.yml b/tools/accuracy_checker/configs/densenet-169-tf.yml
index 5ae3f06e8eb..4dc7a63d0fd 100644
--- a/tools/accuracy_checker/configs/densenet-169-tf.yml
+++ b/tools/accuracy_checker/configs/densenet-169-tf.yml
@@ -22,3 +22,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/densenet-169.yml b/tools/accuracy_checker/configs/densenet-169.yml
index 4c407a70520..c602275b3ba 100644
--- a/tools/accuracy_checker/configs/densenet-169.yml
+++ b/tools/accuracy_checker/configs/densenet-169.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/densenet-201.yml b/tools/accuracy_checker/configs/densenet-201.yml
index e6ab1db0c2e..a92b61b700d 100644
--- a/tools/accuracy_checker/configs/densenet-201.yml
+++ b/tools/accuracy_checker/configs/densenet-201.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/driver-action-recognition-adas-0002-decoder.yml b/tools/accuracy_checker/configs/driver-action-recognition-adas-0002-decoder.yml
new file mode 100644
index 00000000000..bae8234c41e
--- /dev/null
+++ b/tools/accuracy_checker/configs/driver-action-recognition-adas-0002-decoder.yml
@@ -0,0 +1,58 @@
+evaluations:
+  - name: driver-action-recognition-adas-0002-encoder
+    module: custom_evaluators.sequential_action_recognition_evaluator.SequentialActionRecognitionEvaluator
+    module_config:
+      network_info:
+        encoder:
+          predictions: kinetics/driver-action-recognition-encoder-predictions.pickle
+
+        decoder:
+          model:   intel/driver-action-recognition-adas-0002-decoder/FP32/driver-action-recognition-adas-0002-decoder.xml
+          weights: intel/driver-action-recognition-adas-0002-decoder/FP32/driver-action-recognition-adas-0002-decoder.bin
+          num_processing_frames: 16
+          adapter: classification
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP32
+
+      datasets:
+        - name: driver_action_recognition_dataset
+
+          preprocessing:
+            - type: resize
+              size: 224
+              aspect_ratio_scale: fit_to_window
+            - type: crop
+              size: 224
+
+          metrics:
+            - type: clip_accuracy
+
+  - name: driver-action-recognition-adas-0002-encoder
+    module: custom_evaluators.sequential_action_recognition_evaluator.SequentialActionRecognitionEvaluator
+    module_config:
+      network_info:
+        encoder:
+          predictions: kinetics/driver-action-recognition-encoder-predictions.pickle
+
+        decoder:
+          model:   intel/driver-action-recognition-adas-0002-decoder/FP16/driver-action-recognition-adas-0002-decoder.xml
+          weights: intel/driver-action-recognition-adas-0002-decoder/FP16/driver-action-recognition-adas-0002-decoder.bin
+          num_processing_frames: 16
+          adapter: classification
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP16
+
+      datasets:
+        - name: driver_action_recognition_dataset
+
+          metrics:
+            - type: clip_accuracy
+              presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/driver-action-recognition-adas-0002-encoder.yml b/tools/accuracy_checker/configs/driver-action-recognition-adas-0002-encoder.yml
new file mode 100644
index 00000000000..cc32b975739
--- /dev/null
+++ b/tools/accuracy_checker/configs/driver-action-recognition-adas-0002-encoder.yml
@@ -0,0 +1,67 @@
+evaluations:
+  - name: driver-action-recognition-adas-0002-encoder
+    module: custom_evaluators.sequential_action_recognition_evaluator.SequentialActionRecognitionEvaluator
+    module_config:
+      network_info:
+        encoder:
+          model:   intel/driver-action-recognition-adas-0002-encoder/FP32/driver-action-recognition-adas-0002-encoder.xml
+          weights: intel/driver-action-recognition-adas-0002-encoder/FP32/driver-action-recognition-adas-0002-encoder.bin
+
+        decoder:
+          model:   intel/driver-action-recognition-adas-0002-decoder/FP32/driver-action-recognition-adas-0002-decoder.xml
+          weights: intel/driver-action-recognition-adas-0002-decoder/FP32/driver-action-recognition-adas-0002-decoder.bin
+          num_processing_frames: 16
+          adapter: classification
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP32
+
+      datasets:
+        - name: driver_action_recognition_dataset
+
+          preprocessing:
+            - type: resize
+              size: 224
+              aspect_ratio_scale: fit_to_window
+            - type: crop
+              size: 224
+
+          metrics:
+            - type: clip_accuracy
+
+  - name: driver-action-recognition-adas-0002-encoder
+    module: custom_evaluators.sequential_action_recognition_evaluator.SequentialActionRecognitionEvaluator
+    module_config:
+      network_info:
+        encoder:
+          model:   intel/driver-action-recognition-adas-0002-encoder/FP16/driver-action-recognition-adas-0002-encoder.xml
+          weights: intel/driver-action-recognition-adas-0002-encoder/FP16/driver-action-recognition-adas-0002-encoder.bin
+
+        decoder:
+          model:   intel/driver-action-recognition-adas-0002-decoder/FP16/driver-action-recognition-adas-0002-decoder.xml
+          weights: intel/driver-action-recognition-adas-0002-decoder/FP16/driver-action-recognition-adas-0002-decoder.bin
+          num_processing_frames: 16
+          adapter: classification
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP16
+
+      datasets:
+        - name: driver_action_recognition_dataset
+
+          preprocessing:
+            - type: resize
+              size: 224
+              aspect_ratio_scale: fit_to_window
+            - type: crop
+              size: 224
+
+          metrics:
+            - type: clip_accuracy
+              presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/efficientnet-b0-pytorch.yml b/tools/accuracy_checker/configs/efficientnet-b0-pytorch.yml
new file mode 100644
index 00000000000..eff295b2918
--- /dev/null
+++ b/tools/accuracy_checker/configs/efficientnet-b0-pytorch.yml
@@ -0,0 +1,67 @@
+models:
+  - name: efficientnet-b0-pytorch
+
+    launchers:
+      - framework: onnx_runtime
+        model: public/efficientnet-b0-pytorch/efficientnet-b0.onnx
+        adapter: classification
+        inputs:
+          - name: data
+            type: INPUT
+            shape: 1,3,224,224
+
+
+    datasets:
+      - name: imagenet_1000_classes
+        reader: pillow_imread
+
+        preprocessing:
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+            use_pillow: True
+            interpolation: BICUBIC
+
+          - type: crop
+            use_pillow: True
+            size: 224
+
+          - type: normalization
+            mean: (123.675,116.28,103.53)
+            std: (58.395,57.12,57.375)
+
+  - name: efficientnet-b0-pytorch
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/efficientnet-b0-pytorch/FP32/efficientnet-b0-pytorch.xml
+        weights: public/efficientnet-b0-pytorch/FP32/efficientnet-b0-pytorch.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/efficientnet-b0-pytorch/FP16/efficientnet-b0-pytorch.xml
+        weights: public/efficientnet-b0-pytorch/FP16/efficientnet-b0-pytorch.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        reader: pillow_imread
+
+        preprocessing:
+          - type: rgb_to_bgr
+
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+            use_pillow: True
+            interpolation: BICUBIC
+
+          - type: crop
+            use_pillow: True
+            size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/efficientnet-b0.yml b/tools/accuracy_checker/configs/efficientnet-b0.yml
new file mode 100644
index 00000000000..c49b467cd1f
--- /dev/null
+++ b/tools/accuracy_checker/configs/efficientnet-b0.yml
@@ -0,0 +1,56 @@
+models:
+  - name: efficientnet-b0
+
+    launchers:
+      - framework: tf
+        model: public/efficientnet-b0/efficientnet-b0/model.ckpt.meta
+        adapter: classification
+        output_names:
+          - logits
+        inputs:
+          - name: IteratorGetNext
+            type: INPUT
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: bgr_to_rgb
+          - type: crop
+            central_fraction: 0.875
+            use_pillow: True
+          - type: resize
+            size: 224
+            use_pillow: True
+            interpolation: BICUBIC
+
+  - name: efficientnet-b0
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/efficientnet-b0/FP32/efficientnet-b0.xml
+        weights: public/efficientnet-b0/FP32/efficientnet-b0.bin
+        adapter: classification
+        cpu_extensions: AUTO
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/efficientnet-b0/FP16/efficientnet-b0.xml
+        weights: public/efficientnet-b0/FP16/efficientnet-b0.bin
+        adapter: classification
+        cpu_extensions: AUTO
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: crop
+            central_fraction: 0.875
+            use_pillow: True
+          - type: resize
+            size: 224
+            use_pillow: True
+            interpolation: BICUBIC
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/efficientnet-b0_auto_aug.yml b/tools/accuracy_checker/configs/efficientnet-b0_auto_aug.yml
new file mode 100644
index 00000000000..835085813dd
--- /dev/null
+++ b/tools/accuracy_checker/configs/efficientnet-b0_auto_aug.yml
@@ -0,0 +1,55 @@
+models:
+  - name: efficientnet-b0_auto_aug
+
+    launchers:
+      - framework: tf
+        model: public/efficientnet-b0_auto_aug/efficientnet-b0/model.ckpt.meta
+        adapter: classification
+        output_names:
+          - logits
+        inputs:
+          - name: IteratorGetNext
+            type: INPUT
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: bgr_to_rgb
+          - type: crop
+            central_fraction: 0.875
+            use_pillow: True
+          - type: resize
+            size: 224
+            use_pillow: True
+            interpolation: BICUBIC
+
+
+  - name: efficientnet-b0_auto_aug
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/efficientnet-b0_auto_aug/FP32/efficientnet-b0_auto_aug.xml
+        weights: public/efficientnet-b0_auto_aug/FP32/efficientnet-b0_auto_aug.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/efficientnet-b0_auto_aug/FP16/efficientnet-b0_auto_aug.xml
+        weights: public/efficientnet-b0_auto_aug/FP16/efficientnet-b0_auto_aug.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: crop
+            central_fraction: 0.875
+            use_pillow: True
+          - type: resize
+            size: 224
+            use_pillow: True
+            interpolation: BICUBIC
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/efficientnet-b5-pytorch.yml b/tools/accuracy_checker/configs/efficientnet-b5-pytorch.yml
new file mode 100644
index 00000000000..c3f2f8a7b03
--- /dev/null
+++ b/tools/accuracy_checker/configs/efficientnet-b5-pytorch.yml
@@ -0,0 +1,66 @@
+models:
+  - name: efficientnet-b5-pytorch
+
+    launchers:
+      - framework: onnx_runtime
+        model: public/efficientnet-b5-pytorch/efficientnet-b5-pytorch.onnx
+        adapter: classification
+        inputs:
+          - name: data
+            type: INPUT
+            shape: 1,3,456,456
+
+    datasets:
+      - name: imagenet_1000_classes
+        reader: pillow_imread
+
+        preprocessing:
+          - type: resize
+            size: 488
+            aspect_ratio_scale: greater
+            use_pillow: True
+            interpolation: BICUBIC
+            # Crop ratio 0.934
+          - type: crop
+            use_pillow: True
+            size: 456
+
+          - type: normalization
+            mean: (123.675,116.28,103.53)
+            std: (58.395,57.12,57.375)
+
+  - name: efficientnet-b5-pytorch
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/efficientnet-b5-pytorch/FP32/efficientnet-b5-pytorch.xml
+        weights: public/efficientnet-b5-pytorch/FP32/efficientnet-b5-pytorch.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/efficientnet-b5-pytorch/FP16/efficientnet-b5-pytorch.xml
+        weights: public/efficientnet-b5-pytorch/FP16/efficientnet-b5-pytorch.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        reader: pillow_imread
+
+        preprocessing:
+          - type: rgb_to_bgr
+
+          - type: resize
+            size: 488
+            aspect_ratio_scale: greater
+            use_pillow: True
+            interpolation: BICUBIC
+            # Crop ratio 0.934
+          - type: crop
+            use_pillow: True
+            size: 456
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/efficientnet-b5.yml b/tools/accuracy_checker/configs/efficientnet-b5.yml
new file mode 100644
index 00000000000..ab6f3d8eb62
--- /dev/null
+++ b/tools/accuracy_checker/configs/efficientnet-b5.yml
@@ -0,0 +1,54 @@
+models:
+  - name: efficientnet-b5
+
+    launchers:
+      - framework: tf
+        model: public/efficientnet-b5/efficientnet-b5/model.ckpt.meta
+        adapter: classification
+        output_names:
+          - logits
+        inputs:
+          - name: IteratorGetNext
+            type: INPUT
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: bgr_to_rgb
+          - type: crop
+            central_fraction: 0.875
+            use_pillow: True
+          - type: resize
+            size: 456
+            use_pillow: True
+            interpolation: BICUBIC
+
+  - name: efficientnet-b5
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/efficientnet-b5/FP32/efficientnet-b5.xml
+        weights: public/efficientnet-b5/FP32/efficientnet-b5.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/efficientnet-b5/FP16/efficientnet-b5.xml
+        weights: public/efficientnet-b5/FP16/efficientnet-b5.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: crop
+            central_fraction: 0.875
+            use_pillow: True
+          - type: resize
+            size: 456
+            use_pillow: True
+            interpolation: BICUBIC
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/efficientnet-b7-pytorch.yml b/tools/accuracy_checker/configs/efficientnet-b7-pytorch.yml
new file mode 100644
index 00000000000..3cbddbee1c1
--- /dev/null
+++ b/tools/accuracy_checker/configs/efficientnet-b7-pytorch.yml
@@ -0,0 +1,67 @@
+models:
+  - name: efficientnet-b7-pytorch
+
+    launchers:
+      - framework: onnx_runtime
+        model: public/efficientnet-b7-pytorch/efficientnet-b7-pytorch.onnx
+        adapter: classification
+        inputs:
+          - name: data
+            type: INPUT
+            shape: 1,3,600,600
+
+    datasets:
+      - name: imagenet_1000_classes
+        reader: pillow_imread
+
+        preprocessing:
+          - type: resize
+            size: 632
+            aspect_ratio_scale: greater
+            use_pillow: True
+            interpolation: BICUBIC
+            # Crop ratio 0.949
+          - type: crop
+            use_pillow: True
+            size: 600
+
+          - type: normalization
+            mean: (123.675,116.28,103.53)
+            std: (58.395,57.12,57.375)
+
+  - name: efficientnet-b7-pytorch
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/efficientnet-b7-pytorch/FP32/efficientnet-b7-pytorch.xml
+        weights: public/efficientnet-b7-pytorch/FP32/efficientnet-b7-pytorch.bin
+        adapter: classification
+
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/efficientnet-b7-pytorch/FP16/efficientnet-b7-pytorch.xml
+        weights: public/efficientnet-b7-pytorch/FP16/efficientnet-b7-pytorch.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        reader: pillow_imread
+
+        preprocessing:
+          - type: rgb_to_bgr
+
+          - type: resize
+            size: 632
+            aspect_ratio_scale: greater
+            use_pillow: True
+            interpolation: BICUBIC
+            # Crop ratio 0.949
+          - type: crop
+            use_pillow: True
+            size: 600
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/efficientnet-b7_auto_aug.yml b/tools/accuracy_checker/configs/efficientnet-b7_auto_aug.yml
new file mode 100644
index 00000000000..21df6b203d1
--- /dev/null
+++ b/tools/accuracy_checker/configs/efficientnet-b7_auto_aug.yml
@@ -0,0 +1,54 @@
+models:
+  - name: efficientnet-b7_auto_aug
+
+    launchers:
+      - framework: tf
+        model: public/efficientnet-b7_auto_aug/efficientnet-b7/model.ckpt.meta
+        adapter: classification
+        output_names:
+          - logits
+        inputs:
+          - name: IteratorGetNext
+            type: INPUT
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: bgr_to_rgb
+          - type: crop
+            central_fraction: 0.875
+            use_pillow: True
+          - type: resize
+            size: 600
+            use_pillow: True
+            interpolation: BICUBIC
+
+  - name: efficientnet-b7_auto_aug
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/efficientnet-b7_auto_aug/FP32/efficientnet-b7_auto_aug.xml
+        weights: public/efficientnet-b7_auto_aug/FP32/efficientnet-b7_auto_aug.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/efficientnet-b7_auto_aug/FP16/efficientnet-b7_auto_aug.xml
+        weights: public/efficientnet-b7_auto_aug/FP16/efficientnet-b7_auto_aug.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: crop
+            central_fraction: 0.875
+            use_pillow: True
+          - type: resize
+            size: 600
+            use_pillow: True
+            interpolation: BICUBIC
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/emotions-recognition-retail-0003.yml b/tools/accuracy_checker/configs/emotions-recognition-retail-0003.yml
index caed4eacb6f..39d0f8a4e3f 100644
--- a/tools/accuracy_checker/configs/emotions-recognition-retail-0003.yml
+++ b/tools/accuracy_checker/configs/emotions-recognition-retail-0003.yml
@@ -8,7 +8,6 @@ models:
         model:   intel/emotions-recognition-retail-0003/FP32/emotions-recognition-retail-0003.xml
         weights: intel/emotions-recognition-retail-0003/FP32/emotions-recognition-retail-0003.bin
         adapter: classification
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -16,18 +15,18 @@ models:
         model:   intel/emotions-recognition-retail-0003/FP16/emotions-recognition-retail-0003.xml
         weights: intel/emotions-recognition-retail-0003/FP16/emotions-recognition-retail-0003.bin
         adapter: classification
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
-          - INT8
-        model:   intel/emotions-recognition-retail-0003/INT8/emotions-recognition-retail-0003.xml
-        weights: intel/emotions-recognition-retail-0003/INT8/emotions-recognition-retail-0003.bin
+          - FP32-INT8
+        model:   intel/emotions-recognition-retail-0003/FP32-INT8/emotions-recognition-retail-0003.xml
+        weights: intel/emotions-recognition-retail-0003/FP32-INT8/emotions-recognition-retail-0003.bin
         adapter: classification
-        cpu_extensions: AUTO
 
     datasets:
       - name: emotions_recognition
 
         metrics:
           - type: accuracy
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/face-detection-adas-0001.yml b/tools/accuracy_checker/configs/face-detection-adas-0001.yml
index 705ced7085e..65625abaa73 100644
--- a/tools/accuracy_checker/configs/face-detection-adas-0001.yml
+++ b/tools/accuracy_checker/configs/face-detection-adas-0001.yml
@@ -18,10 +18,9 @@ models:
 
       - framework: dlsdk
         tags:
-          - INT8
-        device: CPU
-        model:   intel/face-detection-adas-0001/INT8/face-detection-adas-0001.xml
-        weights: intel/face-detection-adas-0001//INT8/face-detection-adas-0001.bin
+          - FP32-INT8
+        model:   intel/face-detection-adas-0001/FP32-INT8/face-detection-adas-0001.xml
+        weights: intel/face-detection-adas-0001/FP32-INT8/face-detection-adas-0001.bin
         adapter: ssd
 
     datasets:
@@ -44,3 +43,5 @@ models:
             include_boundaries: False
             allow_multiple_matches_per_ignored: True
             use_filtered_tp: True
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/face-detection-adas-binary-0001.yml b/tools/accuracy_checker/configs/face-detection-adas-binary-0001.yml
index 6ed56b249c7..89b8bfe3b06 100644
--- a/tools/accuracy_checker/configs/face-detection-adas-binary-0001.yml
+++ b/tools/accuracy_checker/configs/face-detection-adas-binary-0001.yml
@@ -4,10 +4,9 @@ models:
     launchers:
       - framework: dlsdk
         tags:
-          - INT1
-        device: CPU
-        model:   intel/face-detection-adas-binary-0001/INT1/face-detection-adas-binary-0001.xml
-        weights: intel/face-detection-adas-binary-0001/INT1/face-detection-adas-binary-0001.bin
+          - FP32-INT1
+        model:   intel/face-detection-adas-binary-0001/FP32-INT1/face-detection-adas-binary-0001.xml
+        weights: intel/face-detection-adas-binary-0001/FP32-INT1/face-detection-adas-binary-0001.bin
         adapter: ssd
 
     datasets:
@@ -30,3 +29,5 @@ models:
             include_boundaries: False
             allow_multiple_matches_per_ignored: True
             use_filtered_tp: True
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/face-detection-retail-0004.yml b/tools/accuracy_checker/configs/face-detection-retail-0004.yml
index 58dbf3bfcbb..0280ba6f42c 100644
--- a/tools/accuracy_checker/configs/face-detection-retail-0004.yml
+++ b/tools/accuracy_checker/configs/face-detection-retail-0004.yml
@@ -18,10 +18,9 @@ models:
 
       - framework: dlsdk
         tags:
-          - INT8
-        device: CPU
-        model:   intel/face-detection-retail-0004/INT8/face-detection-retail-0004.xml
-        weights: intel/face-detection-retail-0004/INT8/face-detection-retail-0004.bin
+          - FP32-INT8
+        model:   intel/face-detection-retail-0004/FP32-INT8/face-detection-retail-0004.xml
+        weights: intel/face-detection-retail-0004/FP32-INT8/face-detection-retail-0004.bin
         adapter: ssd
 
     datasets:
@@ -48,3 +47,5 @@ models:
             include_boundaries: False
             allow_multiple_matches_per_ignored: False
             distinct_conf: False
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/face-detection-retail-0005.yml b/tools/accuracy_checker/configs/face-detection-retail-0005.yml
index 78be4cbc3a4..e67e84cbab6 100644
--- a/tools/accuracy_checker/configs/face-detection-retail-0005.yml
+++ b/tools/accuracy_checker/configs/face-detection-retail-0005.yml
@@ -8,7 +8,6 @@ models:
         model:   intel/face-detection-retail-0005/FP32/face-detection-retail-0005.xml
         weights: intel/face-detection-retail-0005/FP32/face-detection-retail-0005.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -16,15 +15,13 @@ models:
         model:   intel/face-detection-retail-0005/FP16/face-detection-retail-0005.xml
         weights: intel/face-detection-retail-0005/FP16/face-detection-retail-0005.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
-          - INT8
-        model:   intel/face-detection-retail-0005/INT8/face-detection-retail-0005.xml
-        weights: intel/face-detection-retail-0005/INT8/face-detection-retail-0005.bin
+          - FP32-INT8
+        model:   intel/face-detection-retail-0005/FP32-INT8/face-detection-retail-0005.xml
+        weights: intel/face-detection-retail-0005/FP32-INT8/face-detection-retail-0005.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
     datasets:
       - name: wider
@@ -50,3 +47,5 @@ models:
             include_boundaries: False
             allow_multiple_matches_per_ignored: True
             distinct_conf: False
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/face-detection-retail-0044.yml b/tools/accuracy_checker/configs/face-detection-retail-0044.yml
index 62302acdcff..2549c7a8889 100644
--- a/tools/accuracy_checker/configs/face-detection-retail-0044.yml
+++ b/tools/accuracy_checker/configs/face-detection-retail-0044.yml
@@ -3,7 +3,6 @@ models:
 
     launchers:
       - framework: caffe
-        device: CPU
         model:   public/face-detection-retail-0044/face-detection-retail-0044.prototxt
         weights: public/face-detection-retail-0044/face-detection-retail-0044.caffemodel
         adapter: ssd
@@ -14,7 +13,6 @@ models:
         model:   public/face-detection-retail-0044/FP32/face-detection-retail-0044.xml
         weights: public/face-detection-retail-0044/FP32/face-detection-retail-0044.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -22,11 +20,6 @@ models:
         model:   public/face-detection-retail-0044/FP16/face-detection-retail-0044.xml
         weights: public/face-detection-retail-0044/FP16/face-detection-retail-0044.bin
         adapter: ssd
-        mo_params:
-            data_type: FP16
-            input_shape: "[1,3,300,300]"
-            input: data
-            output: detection_out
 
     datasets:
       - name: wider
@@ -52,3 +45,5 @@ models:
             include_boundaries: False
             allow_multiple_matches_per_ignored: False
             distinct_conf: False
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/face-recognition-mobilefacenet-arcface.yml b/tools/accuracy_checker/configs/face-recognition-mobilefacenet-arcface.yml
index fada39828a4..2d9e60e3b4d 100644
--- a/tools/accuracy_checker/configs/face-recognition-mobilefacenet-arcface.yml
+++ b/tools/accuracy_checker/configs/face-recognition-mobilefacenet-arcface.yml
@@ -6,28 +6,22 @@ models:
         model: public/face-recognition-mobilefacenet-arcface/model-y1-test2/model-0000.params
         adapter: reid
         inputs:
-        - name: data
-          type: INPUT
-          shape: 3, 112, 112
+          - name: data
+            type: INPUT
+            shape: 3, 112, 112
 
     datasets:
-        - name: lfw
-          data_source: LFW/lfw
-          annotation_conversion:
-            converter: lfw
-            pairs_file: LFW/annotation/pairs.txt
-            landmarks_file: LFW/annotation/lfw_landmark.txt
-          annotation: lfw.pickle
+      - name: lfw
 
-          preprocessing:
-            - type: bgr_to_rgb
-            - type: point_alignment
-              size: 400
-            - type: resize
-              size: 112
+        preprocessing:
+          - type: bgr_to_rgb
+          - type: point_alignment
+            size: 400
+          - type: resize
+            size: 112
 
-          metrics:
-            - type: pairwise_accuracy_subsets
+        metrics:
+          - type: pairwise_accuracy_subsets
 
   - name: face-recognition-mobilefacenet-arcface
 
@@ -48,12 +42,6 @@ models:
 
     datasets:
       - name: lfw
-        data_source: LFW/lfw
-        annotation_conversion:
-          converter: lfw
-          pairs_file: LFW/annotation/pairs.txt
-          landmarks_file: LFW/annotation/lfw_landmark.txt
-        annotation: lfw.pickle
 
         preprocessing:
           - type: point_alignment
@@ -61,5 +49,4 @@ models:
           - type: resize
             size: 112
 
-        metrics:
-          - type: pairwise_accuracy_subsets
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/face-recognition-resnet100-arcface.yml b/tools/accuracy_checker/configs/face-recognition-resnet100-arcface.yml
index 0c9f210eec0..4e4eaa4dc90 100644
--- a/tools/accuracy_checker/configs/face-recognition-resnet100-arcface.yml
+++ b/tools/accuracy_checker/configs/face-recognition-resnet100-arcface.yml
@@ -6,19 +6,12 @@ models:
         model: public/face-recognition-resnet100-arcface/model-r100-ii/model-0000.params
         adapter: reid
         inputs:
-        - name: data
-          type: INPUT
-          shape: 3, 112, 112
-
+          - name: data
+            type: INPUT
+            shape: 3, 112, 112
 
     datasets:
       - name: lfw
-        data_source: LFW/lfw
-        annotation_conversion:
-          converter: lfw
-          pairs_file: LFW/annotation/pairs.txt
-          landmarks_file: LFW/annotation/lfw_landmark.txt
-        annotation: lfw.pickle
 
         preprocessing:
           - type: bgr_to_rgb
@@ -42,12 +35,6 @@ models:
 
     datasets:
       - name: lfw
-        data_source: LFW/lfw
-        annotation_conversion:
-          converter: lfw
-          pairs_file: LFW/annotation/pairs.txt
-          landmarks_file: LFW/annotation/lfw_landmark.txt
-        annotation: lfw.pickle
 
         preprocessing:
           - type: point_alignment
@@ -55,5 +42,4 @@ models:
           - type: resize
             size: 112
 
-        metrics:
-          - type: pairwise_accuracy_subsets
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/face-recognition-resnet34-arcface.yml b/tools/accuracy_checker/configs/face-recognition-resnet34-arcface.yml
index c359fb11890..dfc92100de3 100644
--- a/tools/accuracy_checker/configs/face-recognition-resnet34-arcface.yml
+++ b/tools/accuracy_checker/configs/face-recognition-resnet34-arcface.yml
@@ -6,19 +6,12 @@ models:
         model: public/face-recognition-resnet34-arcface/model-r34-amf/model-0000.params
         adapter: reid
         inputs:
-        - name: data
-          type: INPUT
-          shape: 3, 112, 112
-
+          - name: data
+            type: INPUT
+            shape: 3, 112, 112
 
     datasets:
       - name: lfw
-        data_source: LFW/lfw
-        annotation_conversion:
-          converter: lfw
-          pairs_file: LFW/annotation/pairs.txt
-          landmarks_file: LFW/annotation/lfw_landmark.txt
-        annotation: lfw.pickle
 
         preprocessing:
           - type: bgr_to_rgb
@@ -49,12 +42,6 @@ models:
 
     datasets:
       - name: lfw
-        data_source: LFW/lfw
-        annotation_conversion:
-          converter: lfw
-          pairs_file: LFW/annotation/pairs.txt
-          landmarks_file: LFW/annotation/lfw_landmark.txt
-        annotation: lfw.pickle
 
         preprocessing:
           - type: point_alignment
@@ -62,5 +49,4 @@ models:
           - type: resize
             size: 112
 
-        metrics:
-          - type: pairwise_accuracy_subsets
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/face-recognition-resnet50-arcface.yml b/tools/accuracy_checker/configs/face-recognition-resnet50-arcface.yml
index 030e3970adc..a4bc38bd06f 100644
--- a/tools/accuracy_checker/configs/face-recognition-resnet50-arcface.yml
+++ b/tools/accuracy_checker/configs/face-recognition-resnet50-arcface.yml
@@ -6,18 +6,12 @@ models:
         model: public/face-recognition-resnet50-arcface/model-r50-am-lfw/model-0000.params
         adapter: reid
         inputs:
-        - name: data
-          type: INPUT
-          shape: 3, 112, 112
+          - name: data
+            type: INPUT
+            shape: 3, 112, 112
 
     datasets:
       - name: lfw
-        data_source: LFW/lfw
-        annotation_conversion:
-          converter: lfw
-          pairs_file: LFW/annotation/pairs.txt
-          landmarks_file: LFW/annotation/lfw_landmark.txt
-        annotation: lfw.pickle
 
         preprocessing:
           - type: bgr_to_rgb
@@ -39,7 +33,6 @@ models:
         weights: public/face-recognition-resnet50-arcface//FP32/face-recognition-resnet50-arcface.bin
         adapter: reid
 
-
       - framework: dlsdk
         tags:
           - FP16
@@ -49,12 +42,6 @@ models:
 
     datasets:
       - name: lfw
-        data_source: LFW/lfw
-        annotation_conversion:
-          converter: lfw
-          pairs_file: LFW/annotation/pairs.txt
-          landmarks_file: LFW/annotation/lfw_landmark.txt
-        annotation: lfw.pickle
 
         preprocessing:
           - type: point_alignment
@@ -62,5 +49,4 @@ models:
           - type: resize
             size: 112
 
-        metrics:
-          - type: pairwise_accuracy_subsets
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/face-reidentification-retail-0095.yml b/tools/accuracy_checker/configs/face-reidentification-retail-0095.yml
index 6442f395376..05287c0df5f 100644
--- a/tools/accuracy_checker/configs/face-reidentification-retail-0095.yml
+++ b/tools/accuracy_checker/configs/face-reidentification-retail-0095.yml
@@ -18,19 +18,13 @@ models:
 
       - framework: dlsdk
         tags:
-          - INT8
-        device: CPU
-        model:   intel/face-reidentification-retail-0095/INT8/face-reidentification-retail-0095.xml
-        weights: intel/face-reidentification-retail-0095/INT8/face-reidentification-retail-0095.bin
+          - FP32-INT8
+        model:   intel/face-reidentification-retail-0095/FP32-INT8/face-reidentification-retail-0095.xml
+        weights: intel/face-reidentification-retail-0095/FP32-INT8/face-reidentification-retail-0095.bin
         adapter: reid
 
     datasets:
       - name: lfw
-        data_source: LFW/lfw
-        annotation_conversion:
-          converter: lfw
-          pairs_file: LFW/annotation/pairs.txt
-          landmarks_file: LFW/annotation/lfw_landmark.txt
 
         preprocessing:
           - type: point_alignment
@@ -38,5 +32,4 @@ models:
           - type: resize
             size: 128
 
-        metrics:
-          - type: pairwise_accuracy_subsets
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/facenet-20180408-102900.yml b/tools/accuracy_checker/configs/facenet-20180408-102900.yml
new file mode 100644
index 00000000000..7d89c2d2c08
--- /dev/null
+++ b/tools/accuracy_checker/configs/facenet-20180408-102900.yml
@@ -0,0 +1,28 @@
+models:
+  - name: facenet-20180408-102900
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/facenet-20180408-102900/FP32/facenet-20180408-102900.xml
+        weights: public/facenet-20180408-102900/FP32/facenet-20180408-102900.bin
+        adapter: reid
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/facenet-20180408-102900/FP16/facenet-20180408-102900.xml
+        weights: public/facenet-20180408-102900/FP16/facenet-20180408-102900.bin
+        adapter: reid
+
+    datasets:
+      - name: lfw
+
+        preprocessing:
+          - type: point_alignment
+            size: 400
+          - type: resize
+            size: 160
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/facial-landmarks-35-adas-0002.yml b/tools/accuracy_checker/configs/facial-landmarks-35-adas-0002.yml
index d32ac764d9e..674d054262f 100644
--- a/tools/accuracy_checker/configs/facial-landmarks-35-adas-0002.yml
+++ b/tools/accuracy_checker/configs/facial-landmarks-35-adas-0002.yml
@@ -8,7 +8,6 @@ models:
         model:   intel/facial-landmarks-35-adas-0002/FP32/facial-landmarks-35-adas-0002.xml
         weights: intel/facial-landmarks-35-adas-0002/FP32/facial-landmarks-35-adas-0002.bin
         adapter: landmarks_regression
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -16,7 +15,13 @@ models:
         model:   intel/facial-landmarks-35-adas-0002/FP16/facial-landmarks-35-adas-0002.xml
         weights: intel/facial-landmarks-35-adas-0002/FP16/facial-landmarks-35-adas-0002.bin
         adapter: landmarks_regression
-        cpu_extensions: AUTO
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/facial-landmarks-35-adas-0002/FP32-INT8/facial-landmarks-35-adas-0002.xml
+        weights: intel/facial-landmarks-35-adas-0002/FP32-INT8/facial-landmarks-35-adas-0002.bin
+        adapter: landmarks_regression
 
     datasets:
       - name: facial_landmarks_35
@@ -26,3 +31,5 @@ models:
             calculate_std: True
             percentile: 90
             presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/faster_rcnn_inception_resnet_v2_atrous_coco.yml b/tools/accuracy_checker/configs/faster_rcnn_inception_resnet_v2_atrous_coco.yml
index 04ceb8c76fc..3c36a5d1f17 100644
--- a/tools/accuracy_checker/configs/faster_rcnn_inception_resnet_v2_atrous_coco.yml
+++ b/tools/accuracy_checker/configs/faster_rcnn_inception_resnet_v2_atrous_coco.yml
@@ -10,7 +10,7 @@ models:
         inputs:
           - name: image_info
             type: CONST_INPUT
-            value: [[1, 600, 600]]
+            value: [[600, 1024, 1]]
 
       - framework: dlsdk
         tags:
@@ -21,14 +21,12 @@ models:
         inputs:
           - name: image_info
             type: CONST_INPUT
-            value: [[1, 600, 600]]
+            value: [[600, 1024, 1]]
 
     datasets:
       - name: ms_coco_detection_91_classes
-        preprocessing:
-          - type: resize
-            size: 600
-        postprocessing:
-          - type: resize_prediction_boxes
         metrics:
           - type: coco_precision
+            max_detections: 100
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/faster_rcnn_inception_v2_coco.yml b/tools/accuracy_checker/configs/faster_rcnn_inception_v2_coco.yml
index ec477c239e5..4927d7b491b 100644
--- a/tools/accuracy_checker/configs/faster_rcnn_inception_v2_coco.yml
+++ b/tools/accuracy_checker/configs/faster_rcnn_inception_v2_coco.yml
@@ -10,8 +10,7 @@ models:
         inputs:
           - name: image_info
             type: CONST_INPUT
-            value: [[1, 600, 600]]
-
+            value: [[600, 1024, 1]]
       - framework: dlsdk
         tags:
           - FP16
@@ -21,14 +20,12 @@ models:
         inputs:
           - name: image_info
             type: CONST_INPUT
-            value: [[1, 600, 600]]
+            value: [[600, 1024, 1]]
 
     datasets:
       - name: ms_coco_detection_91_classes
-        preprocessing:
-          - type: resize
-            size: 600
-        postprocessing:
-          - type: resize_prediction_boxes
         metrics:
           - type: coco_precision
+            max_detections: 100
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/faster_rcnn_resnet101_coco.yml b/tools/accuracy_checker/configs/faster_rcnn_resnet101_coco.yml
index 9d8dbb485b0..12aa6baaaac 100644
--- a/tools/accuracy_checker/configs/faster_rcnn_resnet101_coco.yml
+++ b/tools/accuracy_checker/configs/faster_rcnn_resnet101_coco.yml
@@ -10,7 +10,7 @@ models:
         inputs:
           - name: image_info
             type: CONST_INPUT
-            value: [[1, 600, 600]]
+            value: [[600, 1024, 1]]
 
       - framework: dlsdk
         tags:
@@ -21,14 +21,12 @@ models:
         inputs:
           - name: image_info
             type: CONST_INPUT
-            value: [[1, 600, 600]]
+            value: [[600, 1024, 1]]
 
     datasets:
       - name: ms_coco_detection_91_classes
-        preprocessing:
-          - type: resize
-            size: 600
-        postprocessing:
-          - type: resize_prediction_boxes
         metrics:
           - type: coco_precision
+            max_detections: 100
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/faster_rcnn_resnet50_coco.yml b/tools/accuracy_checker/configs/faster_rcnn_resnet50_coco.yml
index 2aa05c4a28c..9d16156c644 100644
--- a/tools/accuracy_checker/configs/faster_rcnn_resnet50_coco.yml
+++ b/tools/accuracy_checker/configs/faster_rcnn_resnet50_coco.yml
@@ -10,7 +10,7 @@ models:
         inputs:
           - name: image_info
             type: CONST_INPUT
-            value: [[1, 600, 600]]
+            value: [[600, 1024, 1]]
 
       - framework: dlsdk
         tags:
@@ -21,14 +21,12 @@ models:
         inputs:
           - name: image_info
             type: CONST_INPUT
-            value: [[1, 600, 600]]
+            value: [[600, 1024, 1]]
 
     datasets:
       - name: ms_coco_detection_91_classes
-        preprocessing:
-          - type: resize
-            size: 600
-        postprocessing:
-          - type: resize_prediction_boxes
         metrics:
           - type: coco_precision
+            max_detections: 100
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/gaze-estimation-adas-0002.yml b/tools/accuracy_checker/configs/gaze-estimation-adas-0002.yml
new file mode 100644
index 00000000000..08c06721dc3
--- /dev/null
+++ b/tools/accuracy_checker/configs/gaze-estimation-adas-0002.yml
@@ -0,0 +1,63 @@
+models:
+  - name: gaze-estimation-adas-0002
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/gaze-estimation-adas-0002/FP32/gaze-estimation-adas-0002.xml
+        weights: intel/gaze-estimation-adas-0002/FP32/gaze-estimation-adas-0002.bin
+        inputs:
+          - name: left_eye_image
+            type: INPUT
+            value: ".*_left.png"
+          - name: right_eye_image
+            type: INPUT
+            value: ".*_right.png"
+          - name: 'head_pose_angles'
+            type: INPUT
+            value: ".*.json"
+        adapter: gaze_estimation
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/gaze-estimation-adas-0002/FP16/gaze-estimation-adas-0002.xml
+        weights: intel/gaze-estimation-adas-0002/FP16/gaze-estimation-adas-0002.bin
+        inputs:
+          - name: left_eye_image
+            type: INPUT
+            value: ".*_left.png"
+          - name: right_eye_image
+            type: INPUT
+            value: ".*_right.png"
+          - name: 'head_pose_angles'
+            type: INPUT
+            value: ".*.json"
+        adapter: gaze_estimation
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/gaze-estimation-adas-0002/FP32-INT8/gaze-estimation-adas-0002.xml
+        weights: intel/gaze-estimation-adas-0002/FP32-INT8/gaze-estimation-adas-0002.bin
+        inputs:
+          - name: left_eye_image
+            type: INPUT
+            value: ".*_left.png"
+          - name: right_eye_image
+            type: INPUT
+            value: ".*_right.png"
+          - name: 'head_pose_angles'
+            type: INPUT
+            value: ".*.json"
+        adapter: gaze_estimation
+
+    datasets:
+      - name: gaze_estimation_dataset
+
+        metrics:
+          - type: angle_error
+            presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/googlenet-v1-tf.yml b/tools/accuracy_checker/configs/googlenet-v1-tf.yml
new file mode 100644
index 00000000000..7ca7685d155
--- /dev/null
+++ b/tools/accuracy_checker/configs/googlenet-v1-tf.yml
@@ -0,0 +1,45 @@
+models:
+  - name: googlenet-v1-tf
+    launchers:
+      - framework: tf
+        model: public/googlenet-v1-tf/inception_v1.frozen.pb
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1001_classes
+        preprocessing:
+          - type: bgr_to_rgb
+          - type: normalization
+            mean: 127.5
+            std: 127.5
+          - type: crop
+            central_fraction: 0.875
+          - type: resize
+            size: 224
+
+
+  - name: googlenet-v1-tf
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/googlenet-v1-tf/FP32/googlenet-v1-tf.xml
+        weights: public/googlenet-v1-tf/FP32/googlenet-v1-tf.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/googlenet-v1-tf/FP16/googlenet-v1-tf.xml
+        weights: public/googlenet-v1-tf/FP16/googlenet-v1-tf.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1001_classes
+        preprocessing:
+          - type: crop
+            central_fraction: 0.875
+          - type: resize
+            size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/googlenet-v1.yml b/tools/accuracy_checker/configs/googlenet-v1.yml
index 9b245a2bde1..747a3b6a00f 100644
--- a/tools/accuracy_checker/configs/googlenet-v1.yml
+++ b/tools/accuracy_checker/configs/googlenet-v1.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/googlenet-v2.yml b/tools/accuracy_checker/configs/googlenet-v2.yml
index d0d3c7b187b..693be9f3cbc 100644
--- a/tools/accuracy_checker/configs/googlenet-v2.yml
+++ b/tools/accuracy_checker/configs/googlenet-v2.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/googlenet-v3-pytorch.yml b/tools/accuracy_checker/configs/googlenet-v3-pytorch.yml
index 1c1a9cfe231..1063801869a 100644
--- a/tools/accuracy_checker/configs/googlenet-v3-pytorch.yml
+++ b/tools/accuracy_checker/configs/googlenet-v3-pytorch.yml
@@ -9,7 +9,7 @@ models:
           - name: data
             type: INPUT
             shape: 1,3,224,224
-      
+
     datasets:
       - name: imagenet_1000_classes
         # images read with Pillow
@@ -21,17 +21,14 @@ models:
             aspect_ratio_scale: greater
             use_pillow: true
             interpolation: BILINEAR
-          
           - type: crop
             size: 299
             use_pillow: true
-
           - type: normalization
             mean: 127.5
             std: 127.5
 
-        # Using accuracy metric, achieved result of public model - 77.45% and 93.56% (top 1 and top 5 respectively)
-
+            # Using accuracy metric, achieved result of public model - 77.45% and 93.56% (top 1 and top 5 respectively)
 
   - name: googlenet-v3-pytorch
 
@@ -43,7 +40,7 @@ models:
         model:   public/googlenet-v3-pytorch/FP32/googlenet-v3-pytorch.xml
         weights: public/googlenet-v3-pytorch/FP32/googlenet-v3-pytorch.bin
         adapter: classification
-      
+
       - framework: dlsdk
         tags:
           - FP16
@@ -59,15 +56,15 @@ models:
         # Image channels must be swapped, because "pillow_imread" reads in RGB, but converted model expect BGR
         preprocessing:
           - type: bgr_to_rgb
-
           - type: resize
             size: 320
             aspect_ratio_scale: greater
             use_pillow: true
             interpolation: BILINEAR
-          
           - type: crop
             size: 299
             use_pillow: true
 
-        # Using accuracy metric, achieved result of public model - 77.45% and 93.56% (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 77.45% and 93.56% (top 1 and top 5 respectively)
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/googlenet-v3.yml b/tools/accuracy_checker/configs/googlenet-v3.yml
index c68b05972cf..f4e68d2831d 100644
--- a/tools/accuracy_checker/configs/googlenet-v3.yml
+++ b/tools/accuracy_checker/configs/googlenet-v3.yml
@@ -41,3 +41,5 @@ models:
             central_fraction: 0.875
           - type: resize
             size: 299
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/googlenet-v4-tf.yml b/tools/accuracy_checker/configs/googlenet-v4-tf.yml
new file mode 100644
index 00000000000..aa3d9ff59b4
--- /dev/null
+++ b/tools/accuracy_checker/configs/googlenet-v4-tf.yml
@@ -0,0 +1,45 @@
+models:
+  - name: googlenet-v4-tf
+    launchers:
+      - framework: tf
+        model: public/googlenet-v4-tf/inception_v4.frozen.pb
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1001_classes
+        preprocessing:
+          - type: bgr_to_rgb
+          - type: normalization
+            mean: 127.5
+            std: 127.5
+          - type: crop
+            central_fraction: 0.875
+          - type: resize
+            size: 299
+
+
+  - name: googlenet-v4-tf
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/googlenet-v4-tf/FP32/googlenet-v4-tf.xml
+        weights: public/googlenet-v4-tf/FP32/googlenet-v4-tf.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/googlenet-v4-tf/FP16/googlenet-v4-tf.xml
+        weights: public/googlenet-v4-tf/FP16/googlenet-v4-tf.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1001_classes
+        preprocessing:
+          - type: crop
+            central_fraction: 0.875
+          - type: resize
+            size: 299
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/googlenet-v4.yml b/tools/accuracy_checker/configs/googlenet-v4.yml
index 9e4c6173290..ea0ebe526b8 100644
--- a/tools/accuracy_checker/configs/googlenet-v4.yml
+++ b/tools/accuracy_checker/configs/googlenet-v4.yml
@@ -40,3 +40,5 @@ models:
             size: 320
           - type: crop
             size: 299
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/handwritten-score-recognition-0003.yml b/tools/accuracy_checker/configs/handwritten-score-recognition-0003.yml
new file mode 100644
index 00000000000..f5a1eb73090
--- /dev/null
+++ b/tools/accuracy_checker/configs/handwritten-score-recognition-0003.yml
@@ -0,0 +1,38 @@
+models:
+  - name: handwritten-score-recognition-0003
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/handwritten-score-recognition-0003/FP32/handwritten-score-recognition-0003.xml
+        weights: intel/handwritten-score-recognition-0003/FP32/handwritten-score-recognition-0003.bin
+        adapter: beam_search_decoder
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/handwritten-score-recognition-0003/FP16/handwritten-score-recognition-0003.xml
+        weights: intel/handwritten-score-recognition-0003/FP16/handwritten-score-recognition-0003.bin
+        adapter: beam_search_decoder
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/handwritten-score-recognition-0003/FP32-INT8/handwritten-score-recognition-0003.xml
+        weights: intel/handwritten-score-recognition-0003/FP32-INT8/handwritten-score-recognition-0003.bin
+        adapter: beam_search_decoder
+
+    datasets:
+      - name: handwritten_score_recognition
+
+        preprocessing:
+          - type: bgr_to_gray
+          - type: resize
+            dst_width: 64
+            dst_height: 32
+
+        metrics:
+          - type: character_recognition_accuracy
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/head-pose-estimation-adas-0001.yml b/tools/accuracy_checker/configs/head-pose-estimation-adas-0001.yml
new file mode 100644
index 00000000000..c732c061311
--- /dev/null
+++ b/tools/accuracy_checker/configs/head-pose-estimation-adas-0001.yml
@@ -0,0 +1,60 @@
+models:
+  - name: head-pose-estimation-adas-0001
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/head-pose-estimation-adas-0001/FP32/head-pose-estimation-adas-0001.xml
+        weights: intel/head-pose-estimation-adas-0001/FP32/head-pose-estimation-adas-0001.bin
+        adapter:
+          type: head_pose
+          angle_yaw: angle_y_fc
+          angle_pitch: angle_p_fc
+          angle_roll: angle_r_fc
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/head-pose-estimation-adas-0001/FP16/head-pose-estimation-adas-0001.xml
+        weights: intel/head-pose-estimation-adas-0001/FP16/head-pose-estimation-adas-0001.bin
+        adapter:
+          type: head_pose
+          angle_yaw: angle_y_fc
+          angle_pitch: angle_p_fc
+          angle_roll: angle_r_fc
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/head-pose-estimation-adas-0001/FP32-INT8/head-pose-estimation-adas-0001.xml
+        weights: intel/head-pose-estimation-adas-0001/FP32-INT8/head-pose-estimation-adas-0001.bin
+        adapter:
+          type: head_pose
+          angle_yaw: angle_y_fc
+          angle_pitch: angle_p_fc
+          angle_roll: angle_r_fc
+
+    datasets:
+      - name: head_pose
+
+        metrics:
+          - name: yaw_mae
+            type: mae
+            presenter: print_vector
+            annotation_source: yaw
+            prediction_source: angle_yaw
+
+          - name: pitch_mae
+            type: mae
+            presenter: print_vector
+            annotation_source: pitch
+            prediction_source: angle_pitch
+
+          - name: roll_mae
+            type: mae
+            presenter: print_vector
+            annotation_source: roll
+            prediction_source: angle_roll
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/human-pose-estimation-0001.yml b/tools/accuracy_checker/configs/human-pose-estimation-0001.yml
index a6cdcd2d22b..09c4e2f1779 100644
--- a/tools/accuracy_checker/configs/human-pose-estimation-0001.yml
+++ b/tools/accuracy_checker/configs/human-pose-estimation-0001.yml
@@ -26,10 +26,9 @@ models:
 
       - framework: dlsdk
         tags:
-          - INT8
-        device: CPU
-        model:   intel/human-pose-estimation-0001/INT8/human-pose-estimation-0001.xml
-        weights: intel/human-pose-estimation-0001/INT8/human-pose-estimation-0001.bin
+          - FP32-INT8
+        model:   intel/human-pose-estimation-0001/FP32-INT8/human-pose-estimation-0001.xml
+        weights: intel/human-pose-estimation-0001/FP32-INT8/human-pose-estimation-0001.bin
         allow_reshape_input: True
         adapter:
           type: human_pose_estimation
@@ -59,3 +58,5 @@ models:
           - name: AP
             type: coco_precision
             max_detections: 20
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/human-pose-estimation-3d-0001.yml b/tools/accuracy_checker/configs/human-pose-estimation-3d-0001.yml
new file mode 100644
index 00000000000..d6fe61d5814
--- /dev/null
+++ b/tools/accuracy_checker/configs/human-pose-estimation-3d-0001.yml
@@ -0,0 +1,46 @@
+models:
+  - name: human-pose-estimation-3d-0001
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/human-pose-estimation-3d-0001/FP32/human-pose-estimation-3d-0001.xml
+        weights: public/human-pose-estimation-3d-0001/FP32/human-pose-estimation-3d-0001.bin
+        allow_reshape_input: True
+        adapter:
+          type: human_pose_estimation_3d
+          features_3d_out: features
+          keypoints_heatmap_out: heatmaps
+          part_affinity_fields_out: pafs
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/human-pose-estimation-3d-0001/FP16/human-pose-estimation-3d-0001.xml
+        weights: public/human-pose-estimation-3d-0001/FP16/human-pose-estimation-3d-0001.bin
+        allow_reshape_input: True
+        adapter:
+          type: human_pose_estimation_3d
+          features_3d_out: features
+          keypoints_heatmap_out: heatmaps
+          part_affinity_fields_out: pafs
+
+    datasets:
+      - name: cmu_panoptic_keypoints
+
+        preprocessing:
+          - type: resize
+            size: 256
+            interpolation: CUBIC
+            aspect_ratio_scale: width
+          - type: padding
+            stride: 8
+
+        postprocessing:
+          - type: translate_3d_poses
+
+        metrics:
+          - type: mpjpe_multiperson
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/image-retrieval-0001.yml b/tools/accuracy_checker/configs/image-retrieval-0001.yml
new file mode 100644
index 00000000000..fb930abbdb2
--- /dev/null
+++ b/tools/accuracy_checker/configs/image-retrieval-0001.yml
@@ -0,0 +1,36 @@
+models:
+  - name: image-retrieval-0001
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/image-retrieval-0001/FP32/image-retrieval-0001.xml
+        weights: intel/image-retrieval-0001/FP32/image-retrieval-0001.bin
+        adapter: reid
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/image-retrieval-0001/FP16/image-retrieval-0001.xml
+        weights: intel/image-retrieval-0001/FP16/image-retrieval-0001.bin
+        adapter: reid
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/image-retrieval-0001/FP32-INT8/image-retrieval-0001.xml
+        weights: intel/image-retrieval-0001/FP32-INT8/image-retrieval-0001.bin
+        adapter: reid
+
+    datasets:
+      - name: image_retrieval
+
+        metrics:
+          - name: rank@1
+            type: cmc
+            top_k: 1
+
+          - type: reid_map
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/inception-resnet-v2-tf.yml b/tools/accuracy_checker/configs/inception-resnet-v2-tf.yml
index 7caf3e21e70..d25d17c054d 100644
--- a/tools/accuracy_checker/configs/inception-resnet-v2-tf.yml
+++ b/tools/accuracy_checker/configs/inception-resnet-v2-tf.yml
@@ -41,3 +41,5 @@ models:
             central_fraction: 0.875
           - type: resize
             size: 299
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/inception-resnet-v2.yml b/tools/accuracy_checker/configs/inception-resnet-v2.yml
index 934c08c2ff3..4b475868d3b 100644
--- a/tools/accuracy_checker/configs/inception-resnet-v2.yml
+++ b/tools/accuracy_checker/configs/inception-resnet-v2.yml
@@ -37,3 +37,5 @@ models:
             size: 320
           - type: crop
             size: 299
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/inceptionv3-int8-sparse-v1-tf-0001.yml b/tools/accuracy_checker/configs/inceptionv3-int8-sparse-v1-tf-0001.yml
deleted file mode 100644
index a00f321c55d..00000000000
--- a/tools/accuracy_checker/configs/inceptionv3-int8-sparse-v1-tf-0001.yml
+++ /dev/null
@@ -1,28 +0,0 @@
-models:
-  - name: inceptionv3-int8-sparse-v1-tf-0001
-
-    launchers:
-      - framework: dlsdk
-        tags:
-          - INT8
-        model:   intel/inceptionv3-int8-sparse-v1-tf-0001/FP32/inceptionv3-int8-sparse-v1-tf-0001.xml
-        weights: intel/inceptionv3-int8-sparse-v1-tf-0001/FP32/inceptionv3-int8-sparse-v1-tf-0001.bin
-        adapter: classification
-        cpu_extensions: AUTO
-
-    datasets:
-      - name: imagenet_1001_classes
-
-        preprocessing:
-        - type: crop
-          central_fraction: 0.875
-        - type: resize
-          size: 299
-
-        metrics:
-          - name: accuracy@top1
-            type: accuracy
-            top_k: 1
-          - name: accuracy@top5
-            type: accuracy
-            top_k: 5
diff --git a/tools/accuracy_checker/configs/inceptionv3-int8-sparse-v2-tf-0001.yml b/tools/accuracy_checker/configs/inceptionv3-int8-sparse-v2-tf-0001.yml
deleted file mode 100644
index 683f16411ff..00000000000
--- a/tools/accuracy_checker/configs/inceptionv3-int8-sparse-v2-tf-0001.yml
+++ /dev/null
@@ -1,28 +0,0 @@
-models:
-  - name: inceptionv3-int8-sparse-v2-tf-0001
-
-    launchers:
-      - framework: dlsdk
-        tags:
-          - INT8
-        model:   intel/inceptionv3-int8-sparse-v2-tf-0001/FP32/inceptionv3-int8-sparse-v2-tf-0001.xml
-        weights: intel/inceptionv3-int8-sparse-v2-tf-0001/FP32/inceptionv3-int8-sparse-v2-tf-0001.bin
-        adapter: classification
-        cpu_extensions: AUTO
-
-    datasets:
-      - name: imagenet_1001_classes
-
-        preprocessing:
-        - type: crop
-          central_fraction: 0.875
-        - type: resize
-          size: 299
-
-        metrics:
-          - name: accuracy@top1
-            type: accuracy
-            top_k: 1
-          - name: accuracy@top5
-            type: accuracy
-            top_k: 5
diff --git a/tools/accuracy_checker/configs/inceptionv3-int8-tf-0001.yml b/tools/accuracy_checker/configs/inceptionv3-int8-tf-0001.yml
deleted file mode 100644
index 4cbfbd5f8df..00000000000
--- a/tools/accuracy_checker/configs/inceptionv3-int8-tf-0001.yml
+++ /dev/null
@@ -1,29 +0,0 @@
-models:
-  - name: inceptionv3-int8-tf-0001
-
-    launchers:
-      - framework: dlsdk
-        tags:
-          - INT8
-        model:   intel/inceptionv3-int8-tf-0001/FP32/inceptionv3-int8-tf-0001.xml
-        weights: intel/inceptionv3-int8-tf-0001/FP32/inceptionv3-int8-tf-0001.bin
-        adapter: classification
-        cpu_extensions: AUTO
-
-
-    datasets:
-      - name: imagenet_1001_classes
-
-        preprocessing:
-        - type: crop
-          central_fraction: 0.875
-        - type: resize
-          size: 299
-
-        metrics:
-          - name: accuracy@top1
-            type: accuracy
-            top_k: 1
-          - name: accuracy@top5
-            type: accuracy
-            top_k: 5
diff --git a/tools/accuracy_checker/configs/instance-segmentation-security-0010.yml b/tools/accuracy_checker/configs/instance-segmentation-security-0010.yml
index 3f81db31b2f..926132b105a 100644
--- a/tools/accuracy_checker/configs/instance-segmentation-security-0010.yml
+++ b/tools/accuracy_checker/configs/instance-segmentation-security-0010.yml
@@ -13,7 +13,6 @@ models:
           scores_out: scores
           boxes_out: boxes
           raw_masks_out: raw_masks
-        cpu_extensions: AUTO
         inputs:
           - name: im_info
             type: IMAGE_INFO
@@ -29,7 +28,6 @@ models:
           scores_out: scores
           boxes_out: boxes
           raw_masks_out: raw_masks
-        cpu_extensions: AUTO
         inputs:
           - name: im_info
             type: IMAGE_INFO
@@ -54,3 +52,5 @@ models:
 
           - name: AP@boxes
             type: coco_orig_precision
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/instance-segmentation-security-0050.yml b/tools/accuracy_checker/configs/instance-segmentation-security-0050.yml
index 16cc200e6d0..f8613794a06 100644
--- a/tools/accuracy_checker/configs/instance-segmentation-security-0050.yml
+++ b/tools/accuracy_checker/configs/instance-segmentation-security-0050.yml
@@ -13,7 +13,6 @@ models:
           scores_out: scores
           boxes_out: boxes
           raw_masks_out: raw_masks
-        cpu_extensions: AUTO
         inputs:
           - name: im_info
             type: IMAGE_INFO
@@ -29,7 +28,6 @@ models:
           scores_out: scores
           boxes_out: boxes
           raw_masks_out: raw_masks
-        cpu_extensions: AUTO
         inputs:
           - name: im_info
             type: IMAGE_INFO
@@ -47,3 +45,5 @@ models:
 
           - name: AP@boxes
             type: coco_orig_precision
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/instance-segmentation-security-0083.yml b/tools/accuracy_checker/configs/instance-segmentation-security-0083.yml
index a8d33423f8b..49ab81d7b15 100644
--- a/tools/accuracy_checker/configs/instance-segmentation-security-0083.yml
+++ b/tools/accuracy_checker/configs/instance-segmentation-security-0083.yml
@@ -13,7 +13,6 @@ models:
           scores_out: scores
           boxes_out: boxes
           raw_masks_out: raw_masks
-        cpu_extensions: AUTO
         inputs:
           - name: im_info
             type: IMAGE_INFO
@@ -29,7 +28,6 @@ models:
           scores_out: scores
           boxes_out: boxes
           raw_masks_out: raw_masks
-        cpu_extensions: AUTO
         inputs:
           - name: im_info
             type: IMAGE_INFO
@@ -54,3 +52,5 @@ models:
 
           - name: AP@boxes
             type: coco_orig_precision
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/landmarks-regression-retail-0009.yml b/tools/accuracy_checker/configs/landmarks-regression-retail-0009.yml
index e67924e8dd4..477e923fcb9 100644
--- a/tools/accuracy_checker/configs/landmarks-regression-retail-0009.yml
+++ b/tools/accuracy_checker/configs/landmarks-regression-retail-0009.yml
@@ -16,13 +16,15 @@ models:
         weights: intel/landmarks-regression-retail-0009/FP16/landmarks-regression-retail-0009.bin
         adapter: landmarks_regression
 
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/landmarks-regression-retail-0009/FP32-INT8/landmarks-regression-retail-0009.xml
+        weights: intel/landmarks-regression-retail-0009/FP32-INT8/landmarks-regression-retail-0009.bin
+        adapter: landmarks_regression
+
     datasets:
       - name: vgg2face
-        data_source: VGGFaces2/test
-        annotation_conversion:
-          converter: vgg_face
-          landmarks_csv_file: VGGFaces2/bb_landmark/loose_landmark_test.csv
-          bbox_csv_file: VGGFaces2/bb_landmark/loose_bb_test.csv
 
         preprocessing:
           - type: crop_rect
@@ -37,3 +39,5 @@ models:
           - type: per_point_normed_error
             presenter: print_vector
           - type: normed_error
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/license-plate-recognition-barrier-0001.yml b/tools/accuracy_checker/configs/license-plate-recognition-barrier-0001.yml
index df603c0051b..f280d2a0a95 100644
--- a/tools/accuracy_checker/configs/license-plate-recognition-barrier-0001.yml
+++ b/tools/accuracy_checker/configs/license-plate-recognition-barrier-0001.yml
@@ -8,7 +8,6 @@ models:
         model:   intel/license-plate-recognition-barrier-0001/FP32/license-plate-recognition-barrier-0001.xml
         weights: intel/license-plate-recognition-barrier-0001/FP32/license-plate-recognition-barrier-0001.bin
         adapter: lpr
-        cpu_extensions: AUTO
         inputs:
           - name: seq_ind
             type: CONST_INPUT
@@ -20,7 +19,6 @@ models:
         model:   intel/license-plate-recognition-barrier-0001/FP16/license-plate-recognition-barrier-0001.xml
         weights: intel/license-plate-recognition-barrier-0001/FP16/license-plate-recognition-barrier-0001.bin
         adapter: lpr
-        cpu_extensions: AUTO
         inputs:
           - name: seq_ind
             type: CONST_INPUT
@@ -28,11 +26,10 @@ models:
 
       - framework: dlsdk
         tags:
-          - INT8
-        model:   intel/license-plate-recognition-barrier-0001/INT8/license-plate-recognition-barrier-0001.xml
-        weights: intel/license-plate-recognition-barrier-0001/INT8/license-plate-recognition-barrier-0001.bin
+          - FP32-INT8
+        model:   intel/license-plate-recognition-barrier-0001/FP32-INT8/license-plate-recognition-barrier-0001.xml
+        weights: intel/license-plate-recognition-barrier-0001/FP32-INT8/license-plate-recognition-barrier-0001.bin
         adapter: lpr
-        cpu_extensions: AUTO
         inputs:
           - name: seq_ind
             type: CONST_INPUT
@@ -41,10 +38,7 @@ models:
     datasets:
       - name: synthetic_chinese_license_plates
 
-        preprocessing:
-          - type: resize
-            dst_width: 94
-            dst_height: 24
-
         metrics:
           - type: character_recognition_accuracy
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/license-plate-recognition-barrier-0007.yml b/tools/accuracy_checker/configs/license-plate-recognition-barrier-0007.yml
index 4ae2d870ae9..c5f3b822d03 100644
--- a/tools/accuracy_checker/configs/license-plate-recognition-barrier-0007.yml
+++ b/tools/accuracy_checker/configs/license-plate-recognition-barrier-0007.yml
@@ -8,7 +8,6 @@ models:
         model:   public/license-plate-recognition-barrier-0007/FP32/license-plate-recognition-barrier-0007.xml
         weights: public/license-plate-recognition-barrier-0007/FP32/license-plate-recognition-barrier-0007.bin
         adapter: lpr
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -16,15 +15,11 @@ models:
         model:   public/license-plate-recognition-barrier-0007/FP16/license-plate-recognition-barrier-0007.xml
         weights: public/license-plate-recognition-barrier-0007/FP16/license-plate-recognition-barrier-0007.bin
         adapter: lpr
-        cpu_extensions: AUTO
 
     datasets:
       - name: synthetic_chinese_license_plates
 
-        preprocessing:
-          - type: resize
-            dst_width: 94
-            dst_height: 24
-
         metrics:
           - type: character_recognition_accuracy
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mask_rcnn_inception_resnet_v2_atrous_coco.yml b/tools/accuracy_checker/configs/mask_rcnn_inception_resnet_v2_atrous_coco.yml
index 3f963f7ffbf..3e3b6d9378a 100644
--- a/tools/accuracy_checker/configs/mask_rcnn_inception_resnet_v2_atrous_coco.yml
+++ b/tools/accuracy_checker/configs/mask_rcnn_inception_resnet_v2_atrous_coco.yml
@@ -11,11 +11,10 @@ models:
           type: mask_rcnn
           detection_out: reshape_do_2d
           raw_masks_out: masks
-        cpu_extensions: AUTO
         inputs:
           - name: image_info
-            type: IMAGE_INFO
-
+            type: CONST_INPUT
+            value: [[800, 1365, 1]]
       - framework: dlsdk
         tags:
           - FP16
@@ -25,19 +24,16 @@ models:
           type: mask_rcnn
           detection_out: reshape_do_2d
           raw_masks_out: masks
-        cpu_extensions: AUTO
         inputs:
           - name: image_info
-            type: IMAGE_INFO
+            type: CONST_INPUT
+            value: [[800, 1365, 1]]
 
     datasets:
       - name: ms_coco_mask_rcnn_short_91_classes
-        preprocessing:
-          - type: resize
-            size: 800
-        postprocessing:
-          - type: resize_prediction_boxes
 
         metrics:
           - type: coco_orig_segm_precision
           - type: coco_orig_precision
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mask_rcnn_inception_v2_coco.yml b/tools/accuracy_checker/configs/mask_rcnn_inception_v2_coco.yml
index 1926b37e29a..1bd2acc0b37 100644
--- a/tools/accuracy_checker/configs/mask_rcnn_inception_v2_coco.yml
+++ b/tools/accuracy_checker/configs/mask_rcnn_inception_v2_coco.yml
@@ -10,10 +10,10 @@ models:
           type: mask_rcnn
           detection_out: reshape_do_2d
           raw_masks_out: masks
-        cpu_extensions: AUTO
         inputs:
           - name: image_info
-            type: IMAGE_INFO
+            type: CONST_INPUT
+            value: [[800, 1365, 1]]
 
       - framework: dlsdk
         tags:
@@ -24,19 +24,16 @@ models:
           type: mask_rcnn
           detection_out: reshape_do_2d
           raw_masks_out: masks
-        cpu_extensions: AUTO
         inputs:
           - name: image_info
-            type: IMAGE_INFO
+            type: CONST_INPUT
+            value: [[800, 1365, 1]]
 
     datasets:
       - name: ms_coco_mask_rcnn_short_91_classes
-        preprocessing:
-          - type: resize
-            size: 800
-        postprocessing:
-          - type: resize_prediction_boxes
 
         metrics:
           - type: coco_orig_segm_precision
           - type: coco_orig_precision
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mask_rcnn_resnet101_atrous_coco.yml b/tools/accuracy_checker/configs/mask_rcnn_resnet101_atrous_coco.yml
index 6598c1deed3..96f8d4f8da3 100644
--- a/tools/accuracy_checker/configs/mask_rcnn_resnet101_atrous_coco.yml
+++ b/tools/accuracy_checker/configs/mask_rcnn_resnet101_atrous_coco.yml
@@ -11,10 +11,10 @@ models:
           type: mask_rcnn
           detection_out: reshape_do_2d
           raw_masks_out: masks
-        cpu_extensions: AUTO
         inputs:
           - name: image_info
-            type: IMAGE_INFO
+            type: CONST_INPUT
+            value: [[800, 1365, 1]]
 
       - framework: dlsdk
         tags:
@@ -25,19 +25,16 @@ models:
           type: mask_rcnn
           detection_out: reshape_do_2d
           raw_masks_out: masks
-        cpu_extensions: AUTO
         inputs:
           - name: image_info
-            type: IMAGE_INFO
+            type: CONST_INPUT
+            value: [[800, 1365, 1]]
 
     datasets:
       - name: ms_coco_mask_rcnn_short_91_classes
-        preprocessing:
-          - type: resize
-            size: 800
-        postprocessing:
-          - type: resize_prediction_boxes
 
         metrics:
           - type: coco_orig_segm_precision
           - type: coco_orig_precision
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mask_rcnn_resnet50_atrous_coco.yml b/tools/accuracy_checker/configs/mask_rcnn_resnet50_atrous_coco.yml
index 46435658fdd..1382f5f19b9 100644
--- a/tools/accuracy_checker/configs/mask_rcnn_resnet50_atrous_coco.yml
+++ b/tools/accuracy_checker/configs/mask_rcnn_resnet50_atrous_coco.yml
@@ -11,10 +11,10 @@ models:
           type: mask_rcnn
           detection_out: reshape_do_2d
           raw_masks_out: masks
-        cpu_extensions: AUTO
         inputs:
           - name: image_info
-            type: IMAGE_INFO
+            type: CONST_INPUT
+            value: [[800, 1365, 1]]
 
       - framework: dlsdk
         tags:
@@ -25,19 +25,15 @@ models:
           type: mask_rcnn
           detection_out: reshape_do_2d
           raw_masks_out: masks
-        cpu_extensions: AUTO
         inputs:
           - name: image_info
-            type: IMAGE_INFO
+            type: CONST_INPUT
+            value: [[800, 1365, 1]]
 
     datasets:
       - name: ms_coco_mask_rcnn_short_91_classes
-        preprocessing:
-          - type: resize
-            size: 800
-        postprocessing:
-          - type: resize_prediction_boxes
-
         metrics:
           - type: coco_orig_segm_precision
           - type: coco_orig_precision
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mobilenet-ssd.yml b/tools/accuracy_checker/configs/mobilenet-ssd.yml
index e03439346ff..87c10ed63eb 100644
--- a/tools/accuracy_checker/configs/mobilenet-ssd.yml
+++ b/tools/accuracy_checker/configs/mobilenet-ssd.yml
@@ -24,7 +24,6 @@ models:
         model:   public/mobilenet-ssd/FP32/mobilenet-ssd.xml
         weights: public/mobilenet-ssd/FP32/mobilenet-ssd.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -32,7 +31,6 @@ models:
         model:   public/mobilenet-ssd/FP16/mobilenet-ssd.xml
         weights: public/mobilenet-ssd/FP16/mobilenet-ssd.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
     datasets:
       - name: VOC2012
@@ -41,3 +39,5 @@ models:
             size: 300
         postprocessing:
           - type: resize_prediction_boxes
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mobilenet-v1-0.25-128.yml b/tools/accuracy_checker/configs/mobilenet-v1-0.25-128.yml
index feaca0b2426..a9993c28cf7 100644
--- a/tools/accuracy_checker/configs/mobilenet-v1-0.25-128.yml
+++ b/tools/accuracy_checker/configs/mobilenet-v1-0.25-128.yml
@@ -41,3 +41,5 @@ models:
             central_fraction: 0.875
           - type: resize
             size: 128
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mobilenet-v1-0.50-160.yml b/tools/accuracy_checker/configs/mobilenet-v1-0.50-160.yml
index e867d6edca7..b0f3c4ac40f 100644
--- a/tools/accuracy_checker/configs/mobilenet-v1-0.50-160.yml
+++ b/tools/accuracy_checker/configs/mobilenet-v1-0.50-160.yml
@@ -41,3 +41,5 @@ models:
             central_fraction: 0.875
           - type: resize
             size: 160
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mobilenet-v1-0.50-224.yml b/tools/accuracy_checker/configs/mobilenet-v1-0.50-224.yml
index dbfad1eae21..addd6f191c9 100644
--- a/tools/accuracy_checker/configs/mobilenet-v1-0.50-224.yml
+++ b/tools/accuracy_checker/configs/mobilenet-v1-0.50-224.yml
@@ -41,3 +41,5 @@ models:
             central_fraction: 0.875
           - type: resize
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mobilenet-v1-1.0-224-tf.yml b/tools/accuracy_checker/configs/mobilenet-v1-1.0-224-tf.yml
index 8e9d94935c6..02c6e37144a 100644
--- a/tools/accuracy_checker/configs/mobilenet-v1-1.0-224-tf.yml
+++ b/tools/accuracy_checker/configs/mobilenet-v1-1.0-224-tf.yml
@@ -41,3 +41,5 @@ models:
             central_fraction: 0.875
           - type: resize
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mobilenet-v1-1.0-224.yml b/tools/accuracy_checker/configs/mobilenet-v1-1.0-224.yml
index 0cf200d96be..3ba7c7f3fab 100644
--- a/tools/accuracy_checker/configs/mobilenet-v1-1.0-224.yml
+++ b/tools/accuracy_checker/configs/mobilenet-v1-1.0-224.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mobilenet-v2-1.0-224.yml b/tools/accuracy_checker/configs/mobilenet-v2-1.0-224.yml
index 99ef1f0061e..d3365674fad 100644
--- a/tools/accuracy_checker/configs/mobilenet-v2-1.0-224.yml
+++ b/tools/accuracy_checker/configs/mobilenet-v2-1.0-224.yml
@@ -41,3 +41,5 @@ models:
             central_fraction: 0.875
           - type: resize
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mobilenet-v2-1.4-224.yml b/tools/accuracy_checker/configs/mobilenet-v2-1.4-224.yml
index 28fe8969817..4a6761b73e6 100644
--- a/tools/accuracy_checker/configs/mobilenet-v2-1.4-224.yml
+++ b/tools/accuracy_checker/configs/mobilenet-v2-1.4-224.yml
@@ -41,3 +41,5 @@ models:
             central_fraction: 0.875
           - type: resize
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mobilenet-v2-pytorch.yml b/tools/accuracy_checker/configs/mobilenet-v2-pytorch.yml
index dc1d3ee2d08..9f314c696f0 100644
--- a/tools/accuracy_checker/configs/mobilenet-v2-pytorch.yml
+++ b/tools/accuracy_checker/configs/mobilenet-v2-pytorch.yml
@@ -15,7 +15,7 @@ models:
         reader: pillow_imread
 
         # In order to be used by model, images must be:
-        # 1) Resized to 256x256 with bilinear interpolation 
+        # 1) Resized to 256x256 with bilinear interpolation
         # 2) Cropped central part 224x224
         # 3) Normalized by 255
         # 4) Normalized by (0.229, 0.224, 0.225) with mean values (0.485, 0.456, 0.406)
@@ -25,7 +25,7 @@ models:
             aspect_ratio_scale: greater
             use_pillow: true
             interpolation: BILINEAR
-          
+
           - type: crop
             size: 224
             use_pillow: true
@@ -34,10 +34,10 @@ models:
             std: 255
 
           - type: normalization
-            mean: (0.485, 0.456, 0.406) 
+            mean: (0.485, 0.456, 0.406)
             std: (0.229, 0.224, 0.225)
 
-        # Using accuracy metric, achieved result of public model - 71.8
+            # Using accuracy metric, achieved result of public model - 71.8
 
   - name: mobilenet_v2_pytorch
 
@@ -49,7 +49,7 @@ models:
         model:   public/mobilenet-v2-pytorch/FP32/mobilenet-v2-pytorch.xml
         weights: public/mobilenet-v2-pytorch/FP32/mobilenet-v2-pytorch.bin
         adapter: classification
-      
+
       - framework: dlsdk
         tags:
           - FP16
@@ -64,15 +64,17 @@ models:
         # Image channels must be swapped, because "pillow_imread" reads in RGB, but converted model expect BGR
         preprocessing:
           - type: bgr_to_rgb
-          
+
           - type: resize
             size: 256
             aspect_ratio_scale: greater
             use_pillow: true
             interpolation: BILINEAR
-          
+
           - type: crop
             size: 224
             use_pillow: true
 
-        # Using accuracy metric, achieved result of public model - 71.8
+            # Using accuracy metric, achieved result of public model - 71.8
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mobilenet-v2.yml b/tools/accuracy_checker/configs/mobilenet-v2.yml
index 454c3c2f636..9a9b7eb0380 100644
--- a/tools/accuracy_checker/configs/mobilenet-v2.yml
+++ b/tools/accuracy_checker/configs/mobilenet-v2.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mobilenetv2-int8-sparse-v1-tf-0001.yml b/tools/accuracy_checker/configs/mobilenetv2-int8-sparse-v1-tf-0001.yml
deleted file mode 100644
index 819d32e1738..00000000000
--- a/tools/accuracy_checker/configs/mobilenetv2-int8-sparse-v1-tf-0001.yml
+++ /dev/null
@@ -1,27 +0,0 @@
-models:
-  - name: mobilenetv2-int8-sparse-v1-tf-0001
-
-    launchers:
-      - framework: dlsdk
-        tags:
-          - INT8
-        model:   intel/mobilenetv2-int8-sparse-v1-tf-0001/FP32/mobilenetv2-int8-sparse-v1-tf-0001.xml
-        weights: intel/mobilenetv2-int8-sparse-v1-tf-0001/FP32/mobilenetv2-int8-sparse-v1-tf-0001.bin
-        adapter: classification
-        cpu_extensions: AUTO
-
-    datasets:
-      - name: imagenet_1001_classes
-        preprocessing:
-        - type: crop
-          central_fraction: 0.875
-        - type: resize
-          size: 224
-
-        metrics:
-          - name: accuracy@top1
-            type: accuracy
-            top_k: 1
-          - name: accuracy@top5
-            type: accuracy
-            top_k: 5
diff --git a/tools/accuracy_checker/configs/mobilenetv2-int8-sparse-v2-tf-0001.yml b/tools/accuracy_checker/configs/mobilenetv2-int8-sparse-v2-tf-0001.yml
deleted file mode 100644
index 8173fa91ee1..00000000000
--- a/tools/accuracy_checker/configs/mobilenetv2-int8-sparse-v2-tf-0001.yml
+++ /dev/null
@@ -1,28 +0,0 @@
-models:
-  - name: mobilenetv2-int8-sparse-v2-tf-0001
-
-    launchers:
-      - framework: dlsdk
-        tags:
-          - INT8
-        model:   intel/mobilenetv2-int8-sparse-v2-tf-0001/FP32/mobilenetv2-int8-sparse-v2-tf-0001.xml
-        weights: intel/mobilenetv2-int8-sparse-v2-tf-0001/FP32/mobilenetv2-int8-sparse-v2-tf-0001.bin
-        adapter: classification
-        cpu_extensions: AUTO
-
-    datasets:
-      - name: imagenet_1001_classes
-
-        preprocessing:
-        - type: crop
-          central_fraction: 0.875
-        - type: resize
-          size: 224
-
-        metrics:
-          - name: accuracy@top1
-            type: accuracy
-            top_k: 1
-          - name: accuracy@top5
-            type: accuracy
-            top_k: 5
diff --git a/tools/accuracy_checker/configs/mobilenetv2-int8-tf-0001.yml b/tools/accuracy_checker/configs/mobilenetv2-int8-tf-0001.yml
deleted file mode 100644
index 953ca511b06..00000000000
--- a/tools/accuracy_checker/configs/mobilenetv2-int8-tf-0001.yml
+++ /dev/null
@@ -1,28 +0,0 @@
-models:
-  - name: mobilenetv2-int8-tf-0001
-
-    launchers:
-      - framework: dlsdk
-        tags:
-          - INT8
-        model:   intel/mobilenetv2-int8-tf-0001/FP32/mobilenetv2-int8-tf-0001.xml
-        weights: intel/mobilenetv2-int8-tf-0001/FP32/mobilenetv2-int8-tf-0001.bin
-        adapter: classification
-        cpu_extensions: AUTO
-
-    datasets:
-      - name: imagenet_1001_classes
-
-        preprocessing:
-        - type: crop
-          central_fraction: 0.875
-        - type: resize
-          size: 224
-
-        metrics:
-          - name: accuracy@top1
-            type: accuracy
-            top_k: 1
-          - name: accuracy@top5
-            type: accuracy
-            top_k: 5
diff --git a/tools/accuracy_checker/configs/mtcnn-o.yml b/tools/accuracy_checker/configs/mtcnn-o.yml
new file mode 100644
index 00000000000..4b2c11f6186
--- /dev/null
+++ b/tools/accuracy_checker/configs/mtcnn-o.yml
@@ -0,0 +1,234 @@
+evaluations:
+  - name: mtcnn-o
+    module: custom_evaluators.mtcnn_evaluator.MTCNNEvaluator
+    module_config:
+      network_info:
+        pnet:
+          model:   public/mtcnn-p/mtcnn-p.prototxt
+          weights: public/mtcnn-p/mtcnn-p.caffemodel
+          outputs:
+            probability_out: prob1
+            region_out: conv4-2
+          inputs:
+            - name: data
+              type: INPUT
+              layout: NCWH
+          preprocessing:
+            - type: bgr_to_rgb
+            - type: pyramid
+              min_size: 10
+              factor: 0.79
+          adapter:
+            type: mtcnn_p
+            probability_out: prob1
+            region_out: conv4-2
+            regions_format: hw
+
+        rnet:
+          model:   public/mtcnn-r/mtcnn-r.prototxt
+          weights: public/mtcnn-r/mtcnn-r.caffemodel
+          outputs:
+            probability_out: prob1
+            region_out: conv5-2
+          inputs:
+            - name: data
+              type: INPUT
+              layout: NCWH
+          preprocessing:
+            - type: bgr_to_rgb
+        onet:
+          model:   public/mtcnn-o/mtcnn-o.prototxt
+          weights: public/mtcnn-o/mtcnn-o.caffemodel
+          outputs:
+            probability_out: prob1
+            region_out: conv6-2
+          inputs:
+            - name: data
+              type: INPUT
+              layout: NCWH
+          preprocessing:
+            - type: bgr_to_rgb
+
+      launchers:
+        - framework: caffe
+
+      datasets:
+        - name: wider
+
+          preprocessing:
+            - type: normalization
+              mean: 127.5
+              std: 128
+
+          postprocessing:
+            - type: filter
+              apply_to: prediction
+              is_empty: True
+            - type: filter
+              height_range: 60
+              apply_to: annotation
+
+          metrics:
+            - type: recall
+              ignore_difficult: True
+              include_boundaries: True
+              allow_multiple_matches_per_ignored: True
+              distinct_conf: False
+
+            - type: map
+              ignore_difficult: True
+              include_boundaries: True
+              allow_multiple_matches_per_ignored: True
+              distinct_conf: False
+
+  - name: mtcnn-o
+    module: custom_evaluators.mtcnn_evaluator.MTCNNEvaluator
+    module_config:
+      network_info:
+        pnet:
+          model:   public/mtcnn-p/FP32/mtcnn-p.xml
+          weights: public/mtcnn-p/FP32/mtcnn-p.bin
+          outputs:
+            probability_out: prob1
+            region_out: conv4-2
+          inputs:
+            - name: data
+              type: INPUT
+              layout: NCWH
+          preprocessing:
+            - type: bgr_to_rgb
+            - type: pyramid
+              min_size: 10
+              factor: 0.79
+
+        rnet:
+          model:   public/mtcnn-r/FP32/mtcnn-r.xml
+          weights: public/mtcnn-r/FP32/mtcnn-r.bin
+          outputs:
+            probability_out: prob1
+            region_out: conv5-2
+          inputs:
+            - name: data
+              type: INPUT
+              layout: NCWH
+          preprocessing:
+            - type: bgr_to_rgb
+
+        onet:
+          model:   public/mtcnn-o/FP32/mtcnn-o.xml
+          weights: public/mtcnn-o/FP32/mtcnn-o.bin
+          outputs:
+            probability_out: prob1
+            region_out: conv6-2
+          inputs:
+            - name: data
+              type: INPUT
+              layout: NCWH
+          preprocessing:
+            - type: bgr_to_rgb
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP32
+
+      datasets:
+        - name: wider
+
+          postprocessing:
+            - type: filter
+              apply_to: prediction
+              is_empty: True
+            - type: filter
+              height_range: 60
+              apply_to: annotation
+
+          metrics:
+            - type: recall
+              ignore_difficult: True
+              include_boundaries: True
+              allow_multiple_matches_per_ignored: True
+              distinct_conf: False
+
+            - type: map
+              ignore_difficult: True
+              include_boundaries: True
+              allow_multiple_matches_per_ignored: True
+              distinct_conf: False
+
+  - name: mtcnn-o
+    module: custom_evaluators.mtcnn_evaluator.MTCNNEvaluator
+    module_config:
+      network_info:
+        pnet:
+          model:   public/mtcnn-p/FP16/mtcnn-p.xml
+          weights: public/mtcnn-p/FP16/mtcnn-p.bin
+          outputs:
+            probability_out: prob1
+            region_out: conv4-2
+          inputs:
+            - name: data
+              type: INPUT
+              layout: NCWH
+          preprocessing:
+            - type: bgr_to_rgb
+            - type: pyramid
+              min_size: 10
+              factor: 0.79
+
+        rnet:
+          model:   public/mtcnn-r/FP16/mtcnn-r.xml
+          weights: public/mtcnn-r/FP16/mtcnn-r.bin
+          outputs:
+            probability_out: prob1
+            region_out: conv5-2
+          inputs:
+            - name: data
+              type: INPUT
+              layout: NCWH
+          preprocessing:
+            - type: bgr_to_rgb
+
+        onet:
+          model:   public/mtcnn-o/FP16/mtcnn-o.xml
+          weights: public/mtcnn-o/FP16/mtcnn-o.bin
+          outputs:
+            probability_out: prob1
+            region_out: conv6-2
+          inputs:
+            - name: data
+              type: INPUT
+              layout: NCWH
+          preprocessing:
+            - type: bgr_to_rgb
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP16
+
+      datasets:
+        - name: wider
+
+          postprocessing:
+            - type: filter
+              apply_to: prediction
+              is_empty: True
+            - type: filter
+              height_range: 60
+              apply_to: annotation
+
+          metrics:
+            - type: recall
+              ignore_difficult: True
+              include_boundaries: True
+              allow_multiple_matches_per_ignored: True
+              distinct_conf: False
+
+            - type: map
+              ignore_difficult: True
+              include_boundaries: True
+              allow_multiple_matches_per_ignored: True
+              distinct_conf: False
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mtcnn-p.yml b/tools/accuracy_checker/configs/mtcnn-p.yml
new file mode 100644
index 00000000000..5f28e4972f6
--- /dev/null
+++ b/tools/accuracy_checker/configs/mtcnn-p.yml
@@ -0,0 +1,107 @@
+models:
+  - name: mtcnn-p
+
+    launchers:
+      - framework: caffe
+        model:   public/mtcnn-p/mtcnn-p.prototxt
+        weights: public/mtcnn-p/mtcnn-p.caffemodel
+        inputs:
+          - name: data
+            type: INPUT
+            layout: NCWH
+        adapter:
+          type: mtcnn_p
+          probability_out: prob1
+          region_out: conv4-2
+        allow_reshape_input: True
+
+    datasets:
+      - name: wider
+
+        preprocessing:
+          - type: bgr_to_rgb
+          - type: pyramid
+            min_size: 20
+            factor: 0.709
+          - type: normalization
+            mean: 127.5
+            std: 128
+
+        postprocessing:
+          - type: cast_to_int
+          - type: filter
+            apply_to: annotation
+            height_range: 60
+            is_empty: True
+          - type: filter
+            min_confidence: 0.99
+            apply_to: prediction
+            remove_filtered: True
+
+        metrics:
+          - type: map
+            ignore_difficult: True
+            include_boundaries: False
+            allow_multiple_matches_per_ignored: False
+            distinct_conf: False
+
+  - name: mtcnn-p
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/mtcnn-p/FP32/mtcnn-p.xml
+        weights: public/mtcnn-p/FP32/mtcnn-p.bin
+        inputs:
+          - name: data
+            type: INPUT
+            layout: NCWH
+        adapter:
+          type: mtcnn_p
+          probability_out: prob1
+          region_out: conv4-2
+        allow_reshape_input: True
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/mtcnn-p/FP16/mtcnn-p.xml
+        weights: public/mtcnn-p/FP16/mtcnn-p.bin
+        inputs:
+          - name: data
+            type: INPUT
+            layout: NCWH
+        adapter:
+          type: mtcnn_p
+          probability_out: prob1
+          region_out: conv4-2
+        allow_reshape_input: True
+
+    datasets:
+      - name: wider
+
+        preprocessing:
+          - type: bgr_to_rgb
+          - type: pyramid
+            min_size: 20
+            factor: 0.709
+
+        postprocessing:
+          - type: cast_to_int
+          - type: filter
+            apply_to: annotation
+            height_range: 60
+            is_empty: True
+          - type: filter
+            min_confidence: 0.99
+            apply_to: prediction
+            remove_filtered: True
+
+        metrics:
+          - type: map
+            ignore_difficult: True
+            include_boundaries: False
+            allow_multiple_matches_per_ignored: False
+            distinct_conf: False
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/mtcnn-r.yml b/tools/accuracy_checker/configs/mtcnn-r.yml
new file mode 100644
index 00000000000..3f5618a7447
--- /dev/null
+++ b/tools/accuracy_checker/configs/mtcnn-r.yml
@@ -0,0 +1,152 @@
+evaluations:
+  - name: mtcnn-r
+    module: custom_evaluators.mtcnn_evaluator.MTCNNEvaluator
+    module_config:
+      network_info:
+        pnet:
+          predictions: pnet_predictions.pickle
+
+        rnet:
+          model:   public/mtcnn-r/mtcnn-r.prototxt
+          weights: public/mtcnn-r/mtcnn-r.caffemodel
+          outputs:
+            probability_out: prob1
+            region_out: conv5-2
+          inputs:
+            - name: data
+              type: INPUT
+              layout: NCWH
+          preprocessing:
+            - type: bgr_to_rgb
+
+      launchers:
+        - framework: caffe
+
+      datasets:
+        - name: wider
+
+          preprocessing:
+            - type: normalization
+              mean: 127.5
+              std: 128
+
+          postprocessing:
+            - type: filter
+              apply_to: prediction
+              is_empty: True
+            - type: filter
+              height_range: 60
+              apply_to: annotation
+
+          metrics:
+            - type: recall
+              ignore_difficult: True
+              include_boundaries: True
+              allow_multiple_matches_per_ignored: True
+              distinct_conf: False
+
+            - type: map
+              ignore_difficult: True
+              include_boundaries: True
+              allow_multiple_matches_per_ignored: True
+              distinct_conf: False
+
+  - name: mtcnn-r
+    module: custom_evaluators.mtcnn_evaluator.MTCNNEvaluator
+    module_config:
+      network_info:
+        pnet:
+          predictions: pnet_predictions.pickle
+
+        rnet:
+          model:   public/mtcnn-r/FP32/mtcnn-r.xml
+          weights: public/mtcnn-r/FP32/mtcnn-r.bin
+          outputs:
+            probability_out: prob1
+            region_out: conv5-2
+          inputs:
+            - name: data
+              type: INPUT
+              layout: NCWH
+          preprocessing:
+            - type: bgr_to_rgb
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP32
+
+      datasets:
+        - name: wider
+
+          postprocessing:
+            - type: filter
+              apply_to: prediction
+              is_empty: True
+            - type: filter
+              height_range: 60
+              apply_to: annotation
+
+          metrics:
+            - type: recall
+              ignore_difficult: True
+              include_boundaries: True
+              allow_multiple_matches_per_ignored: True
+              distinct_conf: False
+
+            - type: map
+              ignore_difficult: True
+              include_boundaries: True
+              allow_multiple_matches_per_ignored: True
+              distinct_conf: False
+
+  - name: mtcnn-r
+    module: custom_evaluators.mtcnn_evaluator.MTCNNEvaluator
+    module_config:
+      network_info:
+        pnet:
+          predictions: pnet_predictions.pickle
+
+        rnet:
+          model:   public/mtcnn-r/FP16/mtcnn-r.xml
+          weights: public/mtcnn-r/FP16/mtcnn-r.bin
+          outputs:
+            probability_out: prob1
+            region_out: conv5-2
+          inputs:
+            - name: data
+              type: INPUT
+              layout: NCWH
+          preprocessing:
+            - type: bgr_to_rgb
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP16
+
+      datasets:
+        - name: wider
+
+          postprocessing:
+            - type: filter
+              apply_to: prediction
+              is_empty: True
+            - type: filter
+              height_range: 60
+              apply_to: annotation
+
+          metrics:
+            - type: recall
+              ignore_difficult: True
+              include_boundaries: True
+              allow_multiple_matches_per_ignored: True
+              distinct_conf: False
+
+            - type: map
+              ignore_difficult: True
+              include_boundaries: True
+              allow_multiple_matches_per_ignored: True
+              distinct_conf: False
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/octave-densenet-121-0.125.yml b/tools/accuracy_checker/configs/octave-densenet-121-0.125.yml
index 03eda9f3cfb..5185ef6258b 100644
--- a/tools/accuracy_checker/configs/octave-densenet-121-0.125.yml
+++ b/tools/accuracy_checker/configs/octave-densenet-121-0.125.yml
@@ -6,7 +6,7 @@ models:
       - framework: mxnet
         model: public/densenet-121-0.125/checkpoint-0-0000.params
         adapter: classification
-        inputs: 
+        inputs:
           - name: 'data'
             type: INPUT
             shape: 3,224,224
@@ -36,7 +36,7 @@ models:
             mean: (124,117,104)
             std: 59.88
 
-        # Using accuracy metric, achieved result of public model - 76.1 / 93.0 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 76.1 / 93.0 (top 1 and top 5 respectively)
 
   # DLSDK inference
   - name: octave-densenet-121-0.125
@@ -48,7 +48,6 @@ models:
         model:   public/octave-densenet-121-0.125/FP32/octave-densenet-121-0.125.xml
         weights: public/octave-densenet-121-0.125/FP32/octave-densenet-121-0.125.bin
         adapter: classification
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -70,4 +69,6 @@ models:
           - type: crop
             size: 224
 
-        # Using accuracy metric, achieved result of public model - 76.1 / 93.0 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 76.1 / 93.0 (top 1 and top 5 respectively)
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/octave-resnet-101-0.125.yml b/tools/accuracy_checker/configs/octave-resnet-101-0.125.yml
index 3a83061b690..3682a6785f0 100644
--- a/tools/accuracy_checker/configs/octave-resnet-101-0.125.yml
+++ b/tools/accuracy_checker/configs/octave-resnet-101-0.125.yml
@@ -6,8 +6,7 @@ models:
       - framework: mxnet
         model: public/octave-resnet-101-0.125/checkpoint-0-0000.params
         adapter: classification
-        cpu_extensions: AUTO
-        inputs: 
+        inputs:
           - name: 'data'
             type: INPUT
             shape: 3,224,224
@@ -37,7 +36,7 @@ models:
             mean: (124,117,104)
             std: 59.88
 
-        # Using accuracy metric, achieved result of public model - 79.2 / 94.4 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 79.2 / 94.4 (top 1 and top 5 respectively)
 
   # DLSDK inference
   - name: octave-resnet-101-0.125
@@ -49,17 +48,14 @@ models:
         model:   public/octave-resnet-101-0.125/FP32/octave-resnet-101-0.125.xml
         weights: public/octave-resnet-101-0.125/FP32/octave-resnet-101-0.125.bin
         adapter: classification
-        cpu_extensions: AUTO
 
 
       - framework: dlsdk
-        device: GPU
         tags:
           - FP16
         model:   public/octave-resnet-101-0.125/FP16/octave-resnet-101-0.125.xml
         weights: public/octave-resnet-101-0.125/FP16/octave-resnet-101-0.125.bin
         adapter: classification
-        cpu_extensions: AUTO
 
     datasets:
       - name: imagenet_1000_classes
@@ -74,4 +70,6 @@ models:
           - type: crop
             size: 224
 
-        # Using accuracy metric, achieved result of public model - 79.2 / 94.4 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 79.2 / 94.4 (top 1 and top 5 respectively)
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/octave-resnet-200-0.125.yml b/tools/accuracy_checker/configs/octave-resnet-200-0.125.yml
index 8baee9ab483..3ae8143221f 100644
--- a/tools/accuracy_checker/configs/octave-resnet-200-0.125.yml
+++ b/tools/accuracy_checker/configs/octave-resnet-200-0.125.yml
@@ -8,7 +8,7 @@ models:
         model: public/octave-resnet-200-0.125/checkpoint-0-0000.params
         adapter: classification
         cpu_extensions: AUTO
-        inputs: 
+        inputs:
           - name: 'data'
             type: INPUT
             shape: 3,224,224
@@ -38,38 +38,25 @@ models:
             mean: (124,117,104)
             std: 59.88
 
-        # Using accuracy metric, achieved result of public model - 80.0 / 94.9 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 80.0 / 94.9 (top 1 and top 5 respectively)
 
   # DLSDK inference
   - name: octave-resnet-200-0.125
 
     launchers:
       - framework: dlsdk
-        device: CPU
         tags:
           - FP32
         model:   public/octave-resnet-200-0.125/FP32/octave-resnet-200-0.125.xml
         weights: public/octave-resnet-200-0.125/FP32/octave-resnet-200-0.125.bin
         adapter: classification
-        cpu_extensions: AUTO
-
-      - framework: dlsdk
-        device: GPU
-        tags:
-          - FP32
-        model: octave-resnet-200-0.125/FP32/octave-resnet-200-0.125.xml
-        weights: octave-resnet-200-0.125/FP32/octave-resnet-200-0.125.bin
-        adapter: classification
-        cpu_extensions: AUTO
 
       - framework: dlsdk
-        device: GPU
         tags:
           - FP16
-        model: octave-resnet-200-0.125/FP16/octave-resnet-200-0.125.xml
-        weights: octave-resnet-200-0.125/FP16/octave-resnet-200-0.125.bin
+        model:   public/octave-resnet-200-0.125/FP16/octave-resnet-200-0.125.xml
+        weights: public/octave-resnet-200-0.125/FP16/octave-resnet-200-0.125.bin
         adapter: classification
-        cpu_extensions: AUTO
 
     datasets:
       - name: imagenet_1000_classes
@@ -84,4 +71,6 @@ models:
           - type: crop
             size: 224
 
-        # Using accuracy metric, achieved result of public model - 80.0 / 94.9 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 80.0 / 94.9 (top 1 and top 5 respectively)
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/octave-resnet-26-0.25.yml b/tools/accuracy_checker/configs/octave-resnet-26-0.25.yml
index 7f39eceb098..0eb67a4af4a 100644
--- a/tools/accuracy_checker/configs/octave-resnet-26-0.25.yml
+++ b/tools/accuracy_checker/configs/octave-resnet-26-0.25.yml
@@ -7,7 +7,7 @@ models:
         model: public/resnet-26-0.250/checkpoint-0-0000.params
         adapter: classification
         cpu_extensions: AUTO
-        inputs: 
+        inputs:
           - name: 'data'
             type: INPUT
             shape: 3,224,224
@@ -37,7 +37,7 @@ models:
             mean: (124,117,104)
             std: 59.88
 
-        # Using accuracy metric, achieved result of public model - 76.1 / 92.6 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 76.1 / 92.6 (top 1 and top 5 respectively)
 
   # DLSDK inference
   - name: octave-resnet-26-0.25
@@ -49,7 +49,6 @@ models:
         model:   public/octave-resnet-26-0.25/FP32/octave-resnet-26-0.25.xml
         weights: public/octave-resnet-26-0.25/FP32/octave-resnet-26-0.25.bin
         adapter: classification
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -57,7 +56,6 @@ models:
         model:   public/octave-resnet-26-0.25/FP16/octave-resnet-26-0.25.xml
         weights: public/octave-resnet-26-0.25/FP16/octave-resnet-26-0.25.bin
         adapter: classification
-        cpu_extensions: AUTO
 
     datasets:
       - name: imagenet_1000_classes
@@ -72,4 +70,6 @@ models:
           - type: crop
             size: 224
 
-        # Using accuracy metric, achieved result of public model - 76.1 / 92.6 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 76.1 / 92.6 (top 1 and top 5 respectively)
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/octave-resnet-50-0.125.yml b/tools/accuracy_checker/configs/octave-resnet-50-0.125.yml
index b1050e3bd19..8ffd45b207f 100644
--- a/tools/accuracy_checker/configs/octave-resnet-50-0.125.yml
+++ b/tools/accuracy_checker/configs/octave-resnet-50-0.125.yml
@@ -6,8 +6,7 @@ models:
       - framework: mxnet
         model: public/octave-resnet-50-0.125/checkpoint-0-0000.params
         adapter: classification
-        cpu_extensions: AUTO
-        inputs: 
+        inputs:
           - name: 'data'
             type: INPUT
             shape: 3,224,224
@@ -37,7 +36,7 @@ models:
             mean: (124,117,104)
             std: 59.88
 
-        # Using accuracy metric, achieved result of public model - 78.2 / 93.9 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 78.2 / 93.9 (top 1 and top 5 respectively)
 
   # DLSDK inference
   - name: octave-resnet-50-0.125
@@ -70,4 +69,6 @@ models:
           - type: crop
             size: 224
 
-        # Using accuracy metric, achieved result of public model - 78.2 / 93.9 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 78.2 / 93.9 (top 1 and top 5 respectively)
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/octave-resnext-101-0.25.yml b/tools/accuracy_checker/configs/octave-resnext-101-0.25.yml
index 4f2b433a283..899f58adbb9 100644
--- a/tools/accuracy_checker/configs/octave-resnext-101-0.25.yml
+++ b/tools/accuracy_checker/configs/octave-resnext-101-0.25.yml
@@ -6,7 +6,7 @@ models:
       - framework: mxnet
         model: public/octave-resnext-101-0.25/checkpoint-0-0000.params
         adapter: classification
-        inputs: 
+        inputs:
           - name: 'data'
             type: INPUT
             shape: 3,224,224
@@ -28,9 +28,9 @@ models:
 
           - type: normalization
             mean: (124,117,104)
-            std: 59.88  
+            std: 59.88
 
-        # Using accuracy metric, achieved result of public model - 79.6 / 94.5 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 79.6 / 94.5 (top 1 and top 5 respectively)
 
   # DLSDK inference
   - name: octave-resnext-101-0.25
@@ -42,7 +42,6 @@ models:
         model:   public/octave-resnext-101-0.25/FP32/octave-resnext-101-0.25.xml
         weights: public/octave-resnext-101-0.25/FP32/octave-resnext-101-0.25.bin
         adapter: classification
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -50,7 +49,6 @@ models:
         model:   public/octave-resnext-101-0.25/FP16/octave-resnext-101-0.25.xml
         weights: public/octave-resnext-101-0.25/FP16/octave-resnext-101-0.25.bin
         adapter: classification
-        cpu_extensions: AUTO
 
     datasets:
       - name: imagenet_1000_classes
@@ -65,4 +63,5 @@ models:
           - type: crop
             size: 224
 
-        # Using accuracy metric, achieved result of public model - 79.6 / 94.5 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 79.6 / 94.5 (top 1 and top 5 respectively)
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/octave-resnext-50-0.25.yml b/tools/accuracy_checker/configs/octave-resnext-50-0.25.yml
index 49f4992a94a..008cfb482b2 100644
--- a/tools/accuracy_checker/configs/octave-resnext-50-0.25.yml
+++ b/tools/accuracy_checker/configs/octave-resnext-50-0.25.yml
@@ -7,8 +7,7 @@ models:
         device: CPU
         model: public/octave-resnext-50-0.25/checkpoint-0-0000.params
         adapter: classification
-        cpu_extensions: AUTO
-        inputs: 
+        inputs:
           - name: 'data'
             type: INPUT
             shape: 3,224,224
@@ -32,7 +31,7 @@ models:
             mean: (124,117,104)
             std: 59.88
 
-        # Using accuracy metric, achieved result of public model - 78.8 / 94.2 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 78.8 / 94.2 (top 1 and top 5 respectively)
 
   # DLSDK inference
   - name: octave-resnext-50-0.25
@@ -44,7 +43,6 @@ models:
         model:   public/octave-resnext-50-0.25/FP32/octave-resnext-50-0.25.xml
         weights: public/octave-resnext-50-0.25/FP32/octave-resnext-50-0.25.bin
         adapter: classification
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -52,7 +50,6 @@ models:
         model:   public/octave-resnext-50-0.25/FP16/octave-resnext-50-0.25.xml
         weights: public/octave-resnext-50-0.25/FP16/octave-resnext-50-0.25.bin
         adapter: classification
-        cpu_extensions: AUTO
 
     datasets:
       - name: imagenet_1000_classes
@@ -67,4 +64,6 @@ models:
           - type: crop
             size: 224
 
-        # Using accuracy metric, achieved result of public model - 78.8 / 94.2 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 78.8 / 94.2 (top 1 and top 5 respectively)
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/octave-se-resnet-50-0.125.yml b/tools/accuracy_checker/configs/octave-se-resnet-50-0.125.yml
index 4b51e367c7a..8246697dfcf 100644
--- a/tools/accuracy_checker/configs/octave-se-resnet-50-0.125.yml
+++ b/tools/accuracy_checker/configs/octave-se-resnet-50-0.125.yml
@@ -7,8 +7,7 @@ models:
         device: CPU
         model: public/octave-se-resnet-50-0.125/checkpoint-0-0000.params
         adapter: classification
-        cpu_extensions: AUTO
-        inputs: 
+        inputs:
           - name: 'data'
             type: INPUT
             shape: 3,224,224
@@ -30,38 +29,25 @@ models:
           - type: normalization
             mean: (124,117,104)
             std: 59.88
-        # Using accuracy metric, achieved result of public model - 78.2 / 93.9 (top 1 and top 5 respectively)
+            # Using accuracy metric, achieved result of public model - 78.2 / 93.9 (top 1 and top 5 respectively)
 
   # DLSDK inference
   - name: octave-se-resnet-50-0.125
 
     launchers:
       - framework: dlsdk
-        device: CPU
-        tags:
-          - FP32
-        model:   public/octave-se-resnet-50-0.125/FP32/octave-se-resnet-50-0.125.xml
-        weights: public/octave-se-resnet-50-0.125/FP32/octave-se-resnet-50-0.125.bin
-        adapter: classification
-        cpu_extensions: AUTO
-
-      - framework: dlsdk
-        device: GPU
         tags:
           - FP32
         model:   public/octave-se-resnet-50-0.125/FP32/octave-se-resnet-50-0.125.xml
         weights: public/octave-se-resnet-50-0.125/FP32/octave-se-resnet-50-0.125.bin
         adapter: classification
-        cpu_extensions: AUTO
 
       - framework: dlsdk
-        device: GPU
         tags:
           - FP16
         model:   public/octave-se-resnet-50-0.125/FP16/octave-se-resnet-50-0.125.xml
         weights: public/octave-se-resnet-50-0.125/FP16/octave-se-resnet-50-0.125.bin
         adapter: classification
-        cpu_extensions: AUTO
 
     datasets:
       - name: imagenet_1000_classes
@@ -74,5 +60,6 @@ models:
 
           - type: crop
             size: 224
+            # Using accuracy metric, achieved result of public model - 78.2 / 93.9 (top 1 and top 5 respectively)
 
-        # Using accuracy metric, achieved result of public model - 78.2 / 93.9 (top 1 and top 5 respectively)
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/pedestrian-and-vehicle-detector-adas-0001.yml b/tools/accuracy_checker/configs/pedestrian-and-vehicle-detector-adas-0001.yml
index 1a9c0c906c0..458de50fc0d 100644
--- a/tools/accuracy_checker/configs/pedestrian-and-vehicle-detector-adas-0001.yml
+++ b/tools/accuracy_checker/configs/pedestrian-and-vehicle-detector-adas-0001.yml
@@ -8,7 +8,6 @@ models:
         model:   intel/pedestrian-and-vehicle-detector-adas-0001/FP32/pedestrian-and-vehicle-detector-adas-0001.xml
         weights: intel/pedestrian-and-vehicle-detector-adas-0001/FP32/pedestrian-and-vehicle-detector-adas-0001.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -16,15 +15,13 @@ models:
         model:   intel/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.xml
         weights: intel/pedestrian-and-vehicle-detector-adas-0001/FP16/pedestrian-and-vehicle-detector-adas-0001.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
-          - INT8
-        model:   intel/pedestrian-and-vehicle-detector-adas-0001/INT8/pedestrian-and-vehicle-detector-adas-0001.xml
-        weights: intel/pedestrian-and-vehicle-detector-adas-0001/INT8/pedestrian-and-vehicle-detector-adas-0001.bin
+          - FP32-INT8
+        model:   intel/pedestrian-and-vehicle-detector-adas-0001/FP32-INT8/pedestrian-and-vehicle-detector-adas-0001.xml
+        weights: intel/pedestrian-and-vehicle-detector-adas-0001/FP32-INT8/pedestrian-and-vehicle-detector-adas-0001.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
     datasets:
       - name: pedestrian_and_vehicle_dataset
@@ -53,3 +50,5 @@ models:
             include_boundaries: True
             allow_multiple_matches_per_ignored: True
             use_filtered_tp: True
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/pedestrian-detection-adas-0002.yml b/tools/accuracy_checker/configs/pedestrian-detection-adas-0002.yml
index 57f61a956bd..ef244d29038 100644
--- a/tools/accuracy_checker/configs/pedestrian-detection-adas-0002.yml
+++ b/tools/accuracy_checker/configs/pedestrian-detection-adas-0002.yml
@@ -8,7 +8,6 @@ models:
         model:   intel/pedestrian-detection-adas-0002/FP32/pedestrian-detection-adas-0002.xml
         weights: intel/pedestrian-detection-adas-0002/FP32/pedestrian-detection-adas-0002.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -16,15 +15,13 @@ models:
         model:   intel/pedestrian-detection-adas-0002/FP16/pedestrian-detection-adas-0002.xml
         weights: intel/pedestrian-detection-adas-0002/FP16/pedestrian-detection-adas-0002.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
-          - INT8
-        model:   intel/pedestrian-detection-adas-0002/INT8/pedestrian-detection-adas-0002.xml
-        weights: intel/pedestrian-detection-adas-0002/INT8/pedestrian-detection-adas-0002.bin
+          - FP32-INT8
+        model:   intel/pedestrian-detection-adas-0002/FP32-INT8/pedestrian-detection-adas-0002.xml
+        weights: intel/pedestrian-detection-adas-0002/FP32-INT8/pedestrian-detection-adas-0002.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
     datasets:
       - name: pedestrian_detection_dataset
@@ -53,3 +50,5 @@ models:
             include_boundaries: True
             allow_multiple_matches_per_ignored: True
             use_filtered_tp: True
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/pedestrian-detection-adas-binary-0001.yml b/tools/accuracy_checker/configs/pedestrian-detection-adas-binary-0001.yml
index 470e50b55b5..9a217e967d6 100644
--- a/tools/accuracy_checker/configs/pedestrian-detection-adas-binary-0001.yml
+++ b/tools/accuracy_checker/configs/pedestrian-detection-adas-binary-0001.yml
@@ -4,11 +4,10 @@ models:
     launchers:
       - framework: dlsdk
         tags:
-          - INT1
-        model:   intel/pedestrian-detection-adas-binary-0001/INT1/pedestrian-detection-adas-binary-0001.xml
-        weights: intel/pedestrian-detection-adas-binary-0001/INT1/pedestrian-detection-adas-binary-0001.bin
+          - FP32-INT1
+        model:   intel/pedestrian-detection-adas-binary-0001/FP32-INT1/pedestrian-detection-adas-binary-0001.xml
+        weights: intel/pedestrian-detection-adas-binary-0001/FP32-INT1/pedestrian-detection-adas-binary-0001.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
     datasets:
       - name: pedestrian_detection_dataset
@@ -37,3 +36,5 @@ models:
             include_boundaries: True
             allow_multiple_matches_per_ignored: True
             use_filtered_tp: True
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-attributes-recognition-crossroad-0230.yml b/tools/accuracy_checker/configs/person-attributes-recognition-crossroad-0230.yml
index a73722de920..27875dc9e2c 100644
--- a/tools/accuracy_checker/configs/person-attributes-recognition-crossroad-0230.yml
+++ b/tools/accuracy_checker/configs/person-attributes-recognition-crossroad-0230.yml
@@ -20,6 +20,16 @@ models:
           type: person_attributes
           attributes_recognition_out: "453"
 
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/person-attributes-recognition-crossroad-0230/FP32-INT8/person-attributes-recognition-crossroad-0230.xml
+        weights: intel/person-attributes-recognition-crossroad-0230/FP32-INT8/person-attributes-recognition-crossroad-0230.bin
+        adapter:
+          type: person_attributes
+          attributes_recognition_out: "453"
+
+
     datasets:
       - name: person_8_attributes
 
@@ -33,3 +43,5 @@ models:
           - type: f1-score
             calculate_average: False
             presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-detection-action-recognition-0005.yml b/tools/accuracy_checker/configs/person-detection-action-recognition-0005.yml
index bf772ccfcd1..20d4fa563a4 100644
--- a/tools/accuracy_checker/configs/person-detection-action-recognition-0005.yml
+++ b/tools/accuracy_checker/configs/person-detection-action-recognition-0005.yml
@@ -18,7 +18,6 @@ models:
           detection_threshold: 0.4
           action_confidence_threshold: 0.75
           action_scale: 3
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -36,13 +35,12 @@ models:
           detection_threshold: 0.4
           action_confidence_threshold: 0.75
           action_scale: 3
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
-          - INT8
-        model:   intel/person-detection-action-recognition-0005/INT8/person-detection-action-recognition-0005.xml
-        weights: intel/person-detection-action-recognition-0005/INT8/person-detection-action-recognition-0005.bin
+          - FP32-INT8
+        model:   intel/person-detection-action-recognition-0005/FP32-INT8/person-detection-action-recognition-0005.xml
+        weights: intel/person-detection-action-recognition-0005/FP32-INT8/person-detection-action-recognition-0005.bin
         adapter:
           type: action_detection
           priorbox_out: mbox/priorbox
@@ -54,7 +52,6 @@ models:
           detection_threshold: 0.4
           action_confidence_threshold: 0.75
           action_scale: 3
-        cpu_extensions: AUTO
 
     datasets:
       - name: action_detection_dataset_3_classes
@@ -98,3 +95,5 @@ models:
             prediction_source: action_prediction
             label_map: action_label_map
             ignore_label: 3
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-detection-action-recognition-0006.yml b/tools/accuracy_checker/configs/person-detection-action-recognition-0006.yml
index 62e329629c2..6bda92af0f0 100644
--- a/tools/accuracy_checker/configs/person-detection-action-recognition-0006.yml
+++ b/tools/accuracy_checker/configs/person-detection-action-recognition-0006.yml
@@ -1,120 +1,118 @@
 models:
- - name: person-detection-action-recognition-0006
+  - name: person-detection-action-recognition-0006
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/person-detection-action-recognition-0006/FP32/person-detection-action-recognition-0006.xml
+        weights: intel/person-detection-action-recognition-0006/FP32/person-detection-action-recognition-0006.bin
+        adapter:
+          type: action_detection
+          multihead_net: True
+          loc_out: ActionNet/out_detection_loc
+          main_conf_out: ActionNet/out_detection_conf
+          add_conf_out_prefix: ActionNet/action_heads/out_head_
+          add_conf_out_suffix: _anchor_
+          head_sizes: [1, 4]
+          head_scales: [8, 16]
+          anchors: [[[58.670372, 26.17863728]],
+                    [[81.829632, 35.36],
+                     [107.651852, 45.8114572],
+                     [142.595732, 63.31491832],
+                     [201.107692, 93.5070856]]]
+          variance: [0.1, 0.1, 0.2, 0.2]
+          in_sizes: [400, 680]
+          num_action_classes: 6
+          detection_threshold: 0.3
+          action_scale: 16.0
 
-   launchers:
-     - framework: dlsdk
-       tags:
-         - FP32
-       model:   intel/person-detection-action-recognition-0006/FP32/person-detection-action-recognition-0006.xml
-       weights: intel/person-detection-action-recognition-0006/FP32/person-detection-action-recognition-0006.bin
-       adapter:
-         type: action_detection
-         multihead_net: True
-         loc_out: ActionNet/out_detection_loc
-         main_conf_out: ActionNet/out_detection_conf
-         add_conf_out_prefix: ActionNet/action_heads/out_head_
-         add_conf_out_suffix: _anchor_
-         head_sizes: [1, 4]
-         head_scales: [8, 16]
-         anchors: [[[58.670372, 26.17863728]],
-                   [[81.829632, 35.36],
-                    [107.651852, 45.8114572],
-                    [142.595732, 63.31491832],
-                    [201.107692, 93.5070856]]]
-         variance: [0.1, 0.1, 0.2, 0.2]
-         in_sizes: [400, 680]
-         num_action_classes: 6
-         detection_threshold: 0.3
-         action_scale: 16.0
-       cpu_extensions: AUTO
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/person-detection-action-recognition-0006/FP16/person-detection-action-recognition-0006.xml
+        weights: intel/person-detection-action-recognition-0006/FP16/person-detection-action-recognition-0006.bin
+        adapter:
+          type: action_detection
+          multihead_net: True
+          loc_out: ActionNet/out_detection_loc
+          main_conf_out: ActionNet/out_detection_conf
+          add_conf_out_prefix: ActionNet/action_heads/out_head_
+          add_conf_out_suffix: _anchor_
+          head_sizes: [1, 4]
+          head_scales: [8, 16]
+          anchors: [[[58.670372, 26.17863728]],
+                    [[81.829632, 35.36],
+                     [107.651852, 45.8114572],
+                     [142.595732, 63.31491832],
+                     [201.107692, 93.5070856]]]
+          variance: [0.1, 0.1, 0.2, 0.2]
+          in_sizes: [400, 680]
+          num_action_classes: 6
+          detection_threshold: 0.3
+          action_scale: 16.0
 
-     - framework: dlsdk
-       tags:
-         - FP16
-       model:   intel/person-detection-action-recognition-0006/FP16/person-detection-action-recognition-0006.xml
-       weights: intel/person-detection-action-recognition-0006/FP16/person-detection-action-recognition-0006.bin
-       adapter:
-         type: action_detection
-         multihead_net: True
-         loc_out: ActionNet/out_detection_loc
-         main_conf_out: ActionNet/out_detection_conf
-         add_conf_out_prefix: ActionNet/action_heads/out_head_
-         add_conf_out_suffix: _anchor_
-         head_sizes: [1, 4]
-         head_scales: [8, 16]
-         anchors: [[[58.670372, 26.17863728]],
-                   [[81.829632, 35.36],
-                    [107.651852, 45.8114572],
-                    [142.595732, 63.31491832],
-                    [201.107692, 93.5070856]]]
-         variance: [0.1, 0.1, 0.2, 0.2]
-         in_sizes: [400, 680]
-         num_action_classes: 6
-         detection_threshold: 0.3
-         action_scale: 16.0
-       cpu_extensions: AUTO
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/person-detection-action-recognition-0006/FP32-INT8/person-detection-action-recognition-0006.xml
+        weights: intel/person-detection-action-recognition-0006/FP32-INT8/person-detection-action-recognition-0006.bin
+        adapter:
+          type: action_detection
+          multihead_net: True
+          loc_out: ActionNet/out_detection_loc
+          main_conf_out: ActionNet/out_detection_conf
+          add_conf_out_prefix: ActionNet/action_heads/out_head_
+          add_conf_out_suffix: _anchor_
+          head_sizes: [1, 4]
+          head_scales: [8, 16]
+          anchors: [[[58.670372, 26.17863728]],
+                    [[81.829632, 35.36],
+                     [107.651852, 45.8114572],
+                     [142.595732, 63.31491832],
+                     [201.107692, 93.5070856]]]
+          variance: [0.1, 0.1, 0.2, 0.2]
+          in_sizes: [400, 680]
+          num_action_classes: 6
+          detection_threshold: 0.3
+          action_scale: 16.0
 
-     - framework: dlsdk
-       tags:
-         - INT8
-       model:   intel/person-detection-action-recognition-0006/INT8/person-detection-action-recognition-0006.xml
-       weights: intel/person-detection-action-recognition-0006/INT8/person-detection-action-recognition-0006.bin
-       adapter:
-         type: action_detection
-         multihead_net: True
-         loc_out: ActionNet/out_detection_loc
-         main_conf_out: ActionNet/out_detection_conf
-         add_conf_out_prefix: ActionNet/action_heads/out_head_
-         add_conf_out_suffix: _anchor_
-         head_sizes: [1, 4]
-         head_scales: [8, 16]
-         anchors: [[[58.670372, 26.17863728]],
-                   [[81.829632, 35.36],
-                    [107.651852, 45.8114572],
-                    [142.595732, 63.31491832],
-                    [201.107692, 93.5070856]]]
-         variance: [0.1, 0.1, 0.2, 0.2]
-         in_sizes: [400, 680]
-         num_action_classes: 6
-         detection_threshold: 0.3
-         action_scale: 16.0
-       cpu_extensions: AUTO
+    datasets:
+      - name: action_detection_dataset_6_classes
 
-   datasets:
-   - name: action_detection_dataset_6_classes
+        preprocessing:
+          - type: resize
+            dst_width: 680
+            dst_height: 400
 
-     preprocessing:
-        - type: resize
-          dst_width: 680
-          dst_height: 400
+        postprocessing:
+          - type: soft_nms
+            sigma: 0.6
+            min_score: 0.3
+            keep_top_k: 200
 
-     postprocessing:
-       - type: soft_nms
-         sigma: 0.6
-         min_score: 0.3
-         keep_top_k: 200
+          - type: filter
+            is_empty: True
+            apply_to: prediction
+            remove_filtered: True
 
-       - type: filter
-         is_empty: True
-         apply_to: prediction
-         remove_filtered: True
+          - type: normalize_boxes
 
-       - type: normalize_boxes
+        metrics:
+          - type: map
+            name: class_agnostic@ap
+            ignore_difficult: False
+            include_boundaries: False
+            allow_multiple_matches_per_ignored: False
+            distinct_conf: True
+            annotation_source: person_annotation
+            prediction_source: class_agnostic_prediction
+            label_map: person_label_map
 
-     metrics:
-       - type: map
-         name: class_agnostic@ap
-         ignore_difficult: False
-         include_boundaries: False
-         allow_multiple_matches_per_ignored: False
-         distinct_conf: True
-         annotation_source: person_annotation
-         prediction_source: class_agnostic_prediction
-         label_map: person_label_map
+          - type: detection_accuracy
+            use_normalization: True
+            annotation_source: action_annotation
+            prediction_source: action_prediction
+            label_map: action_label_map
+            ignore_label: 6
 
-       - type: detection_accuracy
-         use_normalization: True
-         annotation_source: action_annotation
-         prediction_source: action_prediction
-         label_map: action_label_map
-         ignore_label: 6
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-detection-action-recognition-teacher-0002.yml b/tools/accuracy_checker/configs/person-detection-action-recognition-teacher-0002.yml
index 56301b10380..e4eaccb65ba 100644
--- a/tools/accuracy_checker/configs/person-detection-action-recognition-teacher-0002.yml
+++ b/tools/accuracy_checker/configs/person-detection-action-recognition-teacher-0002.yml
@@ -18,7 +18,6 @@ models:
           detection_threshold: 0.4
           action_confidence_threshold: 0.75
           action_scale: 3
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -36,7 +35,23 @@ models:
           detection_threshold: 0.4
           action_confidence_threshold: 0.75
           action_scale: 3
-        cpu_extensions: AUTO
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/person-detection-action-recognition-teacher-0002/FP32-INT8/person-detection-action-recognition-teacher-0002.xml
+        weights: intel/person-detection-action-recognition-teacher-0002/FP32-INT8/person-detection-action-recognition-teacher-0002.bin
+        adapter:
+          type: action_detection
+          priorbox_out: mbox/priorbox
+          loc_out: mbox_loc1/out/conv/flat
+          main_conf_out: mbox_main_conf/out/conv/flat/softmax/flat
+          add_conf_out_prefix: out/anchor
+          add_conf_out_count: 4
+          num_action_classes: 3
+          detection_threshold: 0.4
+          action_confidence_threshold: 0.75
+          action_scale: 3
 
     datasets:
       - name: action_detection_dataset_teacher
@@ -64,21 +79,22 @@ models:
             boxes_normalized: True
 
         metrics:
-         - type: map
-           name: class_agnostic@ap
-           ignore_difficult: False
-           include_boundaries: False
-           allow_multiple_matches_per_ignored: False
-           distinct_conf: True
-           annotation_source: person_annotation
-           prediction_source: class_agnostic_prediction
-           label_map: person_label_map
+          - type: map
+            name: class_agnostic@ap
+            ignore_difficult: False
+            include_boundaries: False
+            allow_multiple_matches_per_ignored: False
+            distinct_conf: True
+            annotation_source: person_annotation
+            prediction_source: class_agnostic_prediction
+            label_map: person_label_map
 
-         - type: detection_accuracy
-           use_normalization: True
-           annotation_source: action_annotation
-           prediction_source: action_prediction
-           label_map: action_label_map
-           fast_match: True
-           ignore_label: 3
+          - type: detection_accuracy
+            use_normalization: True
+            annotation_source: action_annotation
+            prediction_source: action_prediction
+            label_map: action_label_map
+            fast_match: True
+            ignore_label: 3
 
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-detection-asl-0001.yml b/tools/accuracy_checker/configs/person-detection-asl-0001.yml
new file mode 100644
index 00000000000..c11699e3d06
--- /dev/null
+++ b/tools/accuracy_checker/configs/person-detection-asl-0001.yml
@@ -0,0 +1,43 @@
+models:
+  - name: person-detection-asl-0001
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/person-detection-asl-0001/FP32/person-detection-asl-0001.xml
+        weights: intel/person-detection-asl-0001/FP32/person-detection-asl-0001.bin
+        adapter:
+          type: fcos_person
+          output_blob: 17701/Split.0
+          scale: 0.003125
+
+    datasets:
+      - name: mscoco_person_detection
+
+        preprocessing:
+          - type: resize
+            size: 320
+
+        postprocessing:
+          - type: resize_prediction_boxes
+          - type: filter
+            apply_to: annotation
+            height_range: 100
+            aspect_ratio: 0.666, 5
+            is_empty: True
+            min_visibility: partially occluded
+          - type: filter
+            apply_to: prediction
+            height_range: 100
+            is_empty: True
+            aspect_ratio: 0.666, 5
+
+        metrics:
+          - type: map
+            ignore_difficult: True
+            include_boundaries: True
+            allow_multiple_matches_per_ignored: False
+            distinct_conf: False
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-detection-raisinghand-recognition-0001.yml b/tools/accuracy_checker/configs/person-detection-raisinghand-recognition-0001.yml
index 546b7905e73..eaf383bba23 100644
--- a/tools/accuracy_checker/configs/person-detection-raisinghand-recognition-0001.yml
+++ b/tools/accuracy_checker/configs/person-detection-raisinghand-recognition-0001.yml
@@ -18,7 +18,6 @@ models:
           detection_threshold: 0.4
           action_confidence_threshold: 0.75
           action_scale: 3
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -36,7 +35,23 @@ models:
           detection_threshold: 0.4
           action_confidence_threshold: 0.75
           action_scale: 3
-        cpu_extensions: AUTO
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/person-detection-raisinghand-recognition-0001/FP32-INT8/person-detection-raisinghand-recognition-0001.xml
+        weights: intel/person-detection-raisinghand-recognition-0001/FP32-INT8/person-detection-raisinghand-recognition-0001.bin
+        adapter:
+          type: action_detection
+          priorbox_out: mbox/priorbox
+          loc_out: mbox_loc1/out/conv/flat
+          main_conf_out: mbox_main_conf/out/conv/flat/softmax/flat
+          add_conf_out_prefix: out/anchor
+          add_conf_out_count: 4
+          num_action_classes: 2
+          detection_threshold: 0.4
+          action_confidence_threshold: 0.75
+          action_scale: 3
 
     datasets:
       - name: action_detection_dataset_raising_hand
@@ -80,3 +95,5 @@ models:
             prediction_source: action_prediction
             label_map: action_label_map
             ignore_label: 2
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-detection-retail-0002.yml b/tools/accuracy_checker/configs/person-detection-retail-0002.yml
index 1ecbf3edc71..6ba9a290453 100644
--- a/tools/accuracy_checker/configs/person-detection-retail-0002.yml
+++ b/tools/accuracy_checker/configs/person-detection-retail-0002.yml
@@ -8,7 +8,6 @@ models:
         model:   intel/person-detection-retail-0002/FP32/person-detection-retail-0002.xml
         weights: intel/person-detection-retail-0002/FP32/person-detection-retail-0002.bin
         adapter: ssd
-        cpu_extensions: AUTO
         inputs:
           - name: im_info
             type: CONST_INPUT
@@ -20,12 +19,23 @@ models:
         model:   intel/person-detection-retail-0002/FP16/person-detection-retail-0002.xml
         weights: intel/person-detection-retail-0002/FP16/person-detection-retail-0002.bin
         adapter: ssd
-        cpu_extensions: AUTO
         inputs:
           - name: im_info
             type: CONST_INPUT
             value: [[544, 992, 0, 0, 0, 0]]
 
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/person-detection-retail-0002/FP32-INT8/person-detection-retail-0002.xml
+        weights: intel/person-detection-retail-0002/FP32-INT8/person-detection-retail-0002.bin
+        adapter: ssd
+        inputs:
+          - name: im_info
+            type: CONST_INPUT
+            value: [[544, 992, 0, 0, 0, 0]]
+
+
     datasets:
       - name: person_detection
 
@@ -67,3 +77,5 @@ models:
             include_boundaries: False
             allow_multiple_matches_per_ignored: False
             distinct_conf: False
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-detection-retail-0013.yml b/tools/accuracy_checker/configs/person-detection-retail-0013.yml
index 0731eb23663..52e0fd49f51 100644
--- a/tools/accuracy_checker/configs/person-detection-retail-0013.yml
+++ b/tools/accuracy_checker/configs/person-detection-retail-0013.yml
@@ -8,7 +8,6 @@ models:
         model:   intel/person-detection-retail-0013/FP32/person-detection-retail-0013.xml
         weights: intel/person-detection-retail-0013/FP32/person-detection-retail-0013.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -16,15 +15,13 @@ models:
         model:   intel/person-detection-retail-0013/FP16/person-detection-retail-0013.xml
         weights: intel/person-detection-retail-0013/FP16/person-detection-retail-0013.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
-          - INT8
-        model:   intel/person-detection-retail-0013/INT8/person-detection-retail-0013.xml
-        weights: intel/person-detection-retail-0013/INT8/person-detection-retail-0013.bin
+          - FP32-INT8
+        model:   intel/person-detection-retail-0013/FP32-INT8/person-detection-retail-0013.xml
+        weights: intel/person-detection-retail-0013/FP32-INT8/person-detection-retail-0013.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
     datasets:
       - name: person_detection
@@ -54,3 +51,5 @@ models:
             include_boundaries: True
             allow_multiple_matches_per_ignored: False
             distinct_conf: False
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-reidentification-retail-0031.yml b/tools/accuracy_checker/configs/person-reidentification-retail-0031.yml
index c9c6f6b0e42..def8c657c64 100644
--- a/tools/accuracy_checker/configs/person-reidentification-retail-0031.yml
+++ b/tools/accuracy_checker/configs/person-reidentification-retail-0031.yml
@@ -18,26 +18,21 @@ models:
 
       - framework: dlsdk
         tags:
-          - INT8
-        device: CPU
-        model:   intel/person-reidentification-retail-0031/INT8/person-reidentification-retail-0031.xml
-        weights: intel/person-reidentification-retail-0031/INT8/person-reidentification-retail-0031.bin
+          - FP32-INT8
+        model:   intel/person-reidentification-retail-0031/FP32-INT8/person-reidentification-retail-0031.xml
+        weights: intel/person-reidentification-retail-0031/FP32-INT8/person-reidentification-retail-0031.bin
         adapter: reid
 
     datasets:
       - name: market1501
         reader: pillow_imread
-        data_source: Market-1501-v15.09.15
-        annotation_conversion:
-          converter: market1501_reid
-          data_dir: Market-1501-v15.09.15
 
         preprocessing:
           - type: bgr_to_rgb
           - type: resize
             dst_width: 48
             dst_height: 96
-            use_pil: True
+            use_pillow: True
             interpolation: ANTIALIAS
 
         metrics:
@@ -46,3 +41,5 @@ models:
             top_k: 1
 
           - type: reid_map
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-reidentification-retail-0076.yml b/tools/accuracy_checker/configs/person-reidentification-retail-0076.yml
deleted file mode 100644
index 607b1f26cd6..00000000000
--- a/tools/accuracy_checker/configs/person-reidentification-retail-0076.yml
+++ /dev/null
@@ -1,44 +0,0 @@
-models:
-  - name: person-reidentification-retail-0076
-
-    launchers:
-      - framework: dlsdk
-        tags:
-          - FP32
-        model:   intel/person-reidentification-retail-0031/FP32/person-reidentification-retail-0076.xml
-        weights: intel/person-reidentification-retail-0031/FP32/person-reidentification-retail-0076.bin
-        adapter: reid
-
-      - framework: dlsdk
-        tags:
-          - FP16
-        model:   intel/person-reidentification-retail-0031/FP16/person-reidentification-retail-0076.xml
-        weights: intel/person-reidentification-retail-0031/FP16/person-reidentification-retail-0076.bin
-        adapter: reid
-
-      - framework: dlsdk
-        tags:
-          - INT8
-        device: CPU
-        model:   intel/person-reidentification-retail-0031/INT8/person-reidentification-retail-0076.xml
-        weights: intel/person-reidentification-retail-0031/INT8/person-reidentification-retail-0076.bin
-        adapter: reid
-
-    datasets:
-      - name: market1501
-        data_source: Market-1501-v15.09.15
-        annotation_conversion:
-          converter: market1501_reid
-          data_dir: Market-1501-v15.09.15
-
-        preprocessing:
-          - type: resize
-            dst_width: 128
-            dst_height: 384
-
-        metrics:
-          - name: rank@1
-            type: cmc
-            top_k: 1
-
-          - type: reid_map
diff --git a/tools/accuracy_checker/configs/person-reidentification-retail-0079.yml b/tools/accuracy_checker/configs/person-reidentification-retail-0079.yml
deleted file mode 100644
index 3fd8bfd48cf..00000000000
--- a/tools/accuracy_checker/configs/person-reidentification-retail-0079.yml
+++ /dev/null
@@ -1,44 +0,0 @@
-models:
-  - name: person-reidentification-retail-0079
-
-    launchers:
-      - framework: dlsdk
-        tags:
-          - FP32
-        model:   intel/person-reidentification-retail-0079/FP32/person-reidentification-retail-0079.xml
-        weights: intel/person-reidentification-retail-0079/FP32/person-reidentification-retail-0079.bin
-        adapter: reid
-
-      - framework: dlsdk
-        tags:
-          - FP16
-        model:   intel/person-reidentification-retail-0079/FP16/person-reidentification-retail-0079.xml
-        weights: intel/person-reidentification-retail-0079/FP16/person-reidentification-retail-0079.bin
-        adapter: reid
-
-      - framework: dlsdk
-        tags:
-          - INT8
-        device: CPU
-        model:  intel/person-reidentification-retail-0079/dldt/INT8/person-reidentification-retail-0079.xml
-        weights: intel/person-reidentification-retail-0079/0079/dldt/INT8/person-reidentification-retail-0079.bin
-        adapter: reid
-
-    datasets:
-      - name: market1501
-        data_source: Market-1501-v15.09.15
-        annotation_conversion:
-          converter: market1501_reid
-          data_dir: Market-1501-v15.09.15
-
-        preprocessing:
-          - type: resize
-            dst_width: 64
-            dst_height: 160
-
-        metrics:
-          - name: rank@1
-            type: cmc
-            top_k: 1
-
-          - type: reid_map
diff --git a/tools/accuracy_checker/configs/person-reidentification-retail-0103.yml b/tools/accuracy_checker/configs/person-reidentification-retail-0103.yml
new file mode 100644
index 00000000000..5dc771da28b
--- /dev/null
+++ b/tools/accuracy_checker/configs/person-reidentification-retail-0103.yml
@@ -0,0 +1,43 @@
+models:
+  - name: person-reidentification-retail-0103
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/person-reidentification-retail-0103/FP32/person-reidentification-retail-0103.xml
+        weights: intel/person-reidentification-retail-0103/FP32/person-reidentification-retail-0103.bin
+        adapter: reid
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/person-reidentification-retail-0103/FP16/person-reidentification-retail-0103.xml
+        weights: intel/person-reidentification-retail-0103/FP16/person-reidentification-retail-0103.bin
+        adapter: reid
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/person-reidentification-retail-0103/FP32-INT8/person-reidentification-retail-0103.xml
+        weights: intel/person-reidentification-retail-0103/FP32-INT8/person-reidentification-retail-0103.bin
+        adapter: reid
+
+    datasets:
+      - name: globalme-reid
+
+        preprocessing:
+          - type: resize
+            dst_width: 128
+            dst_height: 256
+            use_pillow: True
+            interpolation: BILINEAR
+
+        metrics:
+          - name: rank@1
+            type: cmc
+            top_k: 1
+
+          - type: reid_map
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-reidentification-retail-0107.yml b/tools/accuracy_checker/configs/person-reidentification-retail-0107.yml
new file mode 100644
index 00000000000..1e7af372010
--- /dev/null
+++ b/tools/accuracy_checker/configs/person-reidentification-retail-0107.yml
@@ -0,0 +1,43 @@
+models:
+  - name: person-reidentification-retail-0107
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/person-reidentification-retail-0107/FP32/person-reidentification-retail-0107.xml
+        weights: intel/person-reidentification-retail-0107/FP32/person-reidentification-retail-0107.bin
+        adapter: reid
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/person-reidentification-retail-0107/FP16/person-reidentification-retail-0107.xml
+        weights: intel/person-reidentification-retail-0107/FP16/person-reidentification-retail-0107.bin
+        adapter: reid
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/person-reidentification-retail-0107/FP32-INT8/person-reidentification-retail-0107.xml
+        weights: intel/person-reidentification-retail-0107/FP32-INT8/person-reidentification-retail-0107.bin
+        adapter: reid
+
+    datasets:
+      - name: globalme-reid
+
+        preprocessing:
+          - type: resize
+            dst_width: 128
+            dst_height: 256
+            use_pillow: True
+            interpolation: BILINEAR
+
+        metrics:
+          - name: rank@1
+            type: cmc
+            top_k: 1
+
+          - type: reid_map
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-reidentification-retail-0200.yml b/tools/accuracy_checker/configs/person-reidentification-retail-0200.yml
new file mode 100644
index 00000000000..16ba0a4766c
--- /dev/null
+++ b/tools/accuracy_checker/configs/person-reidentification-retail-0200.yml
@@ -0,0 +1,43 @@
+models:
+  - name: person-reidentification-retail-0200
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/person-reidentification-retail-0200/FP32/person-reidentification-retail-0200.xml
+        weights: intel/person-reidentification-retail-0200/FP32/person-reidentification-retail-0200.bin
+        adapter: reid
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/person-reidentification-retail-0200/FP16/person-reidentification-retail-0200.xml
+        weights: intel/person-reidentification-retail-0200/FP16/person-reidentification-retail-0200.bin
+        adapter: reid
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/person-reidentification-retail-0200/FP32-INT8/person-reidentification-retail-0200.xml
+        weights: intel/person-reidentification-retail-0200/FP32-INT8/person-reidentification-retail-0200.bin
+        adapter: reid
+
+    datasets:
+      - name: globalme-reid
+
+        preprocessing:
+          - type: resize
+            dst_width: 128
+            dst_height: 256
+            use_pillow: True
+            interpolation: BILINEAR
+
+        metrics:
+          - name: rank@1
+            type: cmc
+            top_k: 1
+
+          - type: reid_map
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-vehicle-bike-detection-crossroad-0078.yml b/tools/accuracy_checker/configs/person-vehicle-bike-detection-crossroad-0078.yml
index f9a6c8f55dc..6276608a228 100644
--- a/tools/accuracy_checker/configs/person-vehicle-bike-detection-crossroad-0078.yml
+++ b/tools/accuracy_checker/configs/person-vehicle-bike-detection-crossroad-0078.yml
@@ -8,7 +8,6 @@ models:
         model:   intel/person-vehicle-bike-detection-crossroad-0078/FP32/person-vehicle-bike-detection-crossroad-0078.xml
         weights: intel/person-vehicle-bike-detection-crossroad-0078/FP32/person-vehicle-bike-detection-crossroad-0078.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -16,15 +15,13 @@ models:
         model:   intel/person-vehicle-bike-detection-crossroad-0078/FP16/person-vehicle-bike-detection-crossroad-0078.xml
         weights: intel/person-vehicle-bike-detection-crossroad-0078/FP16/person-vehicle-bike-detection-crossroad-0078.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
-          - INT8
-        model:   intel/person-vehicle-bike-detection-crossroad-0078/INT8/person-vehicle-bike-detection-crossroad-0078.xml
-        weights: intel/person-vehicle-bike-detection-crossroad-0078/INT8/person-vehicle-bike-detection-crossroad-0078.bin
+          - FP32-INT8
+        model:   intel/person-vehicle-bike-detection-crossroad-0078/FP32-INT8/person-vehicle-bike-detection-crossroad-0078.xml
+        weights: intel/person-vehicle-bike-detection-crossroad-0078/FP32-INT8/person-vehicle-bike-detection-crossroad-0078.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
     datasets:
       - name: crossroad_dataset_0078
@@ -53,3 +50,5 @@ models:
             include_boundaries: True
             allow_multiple_matches_per_ignored: True
             use_filtered_tp: False
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/person-vehicle-bike-detection-crossroad-1016.yml b/tools/accuracy_checker/configs/person-vehicle-bike-detection-crossroad-1016.yml
index b6945fd85da..ff4eb99b16e 100644
--- a/tools/accuracy_checker/configs/person-vehicle-bike-detection-crossroad-1016.yml
+++ b/tools/accuracy_checker/configs/person-vehicle-bike-detection-crossroad-1016.yml
@@ -8,7 +8,6 @@ models:
         model:   intel/person-vehicle-bike-detection-crossroad-1016/FP32/person-vehicle-bike-detection-crossroad-1016.xml
         weights: intel/person-vehicle-bike-detection-crossroad-1016/FP32/person-vehicle-bike-detection-crossroad-1016.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -16,7 +15,13 @@ models:
         model:   intel/person-vehicle-bike-detection-crossroad-1016/FP16/person-vehicle-bike-detection-crossroad-1016.xml
         weights: intel/person-vehicle-bike-detection-crossroad-1016/FP16/person-vehicle-bike-detection-crossroad-1016.bin
         adapter: ssd
-        cpu_extensions: AUTO
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/person-vehicle-bike-detection-crossroad-1016/FP32-INT8/person-vehicle-bike-detection-crossroad-1016.xml
+        weights: intel/person-vehicle-bike-detection-crossroad-1016/FP32-INT8/person-vehicle-bike-detection-crossroad-1016.bin
+        adapter: ssd
 
     datasets:
       - name: crossroad_dataset_1016
@@ -44,3 +49,5 @@ models:
             include_boundaries: True
             allow_multiple_matches_per_ignored: True
             use_filtered_tp: False
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/product-detection-0001.yml b/tools/accuracy_checker/configs/product-detection-0001.yml
new file mode 100644
index 00000000000..0293ba5fe00
--- /dev/null
+++ b/tools/accuracy_checker/configs/product-detection-0001.yml
@@ -0,0 +1,40 @@
+models:
+  - name: product-detection-0001
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/product-detection-0001/FP32/product-detection-0001.xml
+        weights: intel/product-detection-0001/FP32/product-detection-0001.bin
+        adapter: ssd
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/product-detection-0001/FP16/product-detection-0001.xml
+        weights: intel/product-detection-0001/FP16/product-detection-0001.bin
+        adapter: ssd
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/product-detection-0001/FP32-INT8/product-detection-0001.xml
+        weights: intel/product-detection-0001/FP32-INT8/product-detection-0001.bin
+        adapter: ssd
+
+    datasets:
+      - name: product_detection
+
+        preprocessing:
+          - type: resize
+            size: 512
+
+        postprocessing:
+          - type: resize_prediction_boxes
+          - type: cast_to_int
+          - type: filter
+            min_confidence: 0.02
+            apply_to: prediction
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/resnet-101.yml b/tools/accuracy_checker/configs/resnet-101.yml
index 24375d1bce5..d526c545e89 100644
--- a/tools/accuracy_checker/configs/resnet-101.yml
+++ b/tools/accuracy_checker/configs/resnet-101.yml
@@ -40,3 +40,5 @@ models:
             aspect_ratio_scale: greater
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/resnet-152.yml b/tools/accuracy_checker/configs/resnet-152.yml
index 6fce425053f..9f98fa5eed8 100644
--- a/tools/accuracy_checker/configs/resnet-152.yml
+++ b/tools/accuracy_checker/configs/resnet-152.yml
@@ -40,3 +40,5 @@ models:
             aspect_ratio_scale: greater
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/resnet-18-pytorch.yml b/tools/accuracy_checker/configs/resnet-18-pytorch.yml
new file mode 100644
index 00000000000..86d02c7b6ca
--- /dev/null
+++ b/tools/accuracy_checker/configs/resnet-18-pytorch.yml
@@ -0,0 +1,73 @@
+models:
+  - name: resnet-18
+
+    launchers:
+      - framework: onnx_runtime
+        model: public/resnet-18-pytorch/resnet-18-pytorch.onnx
+        adapter: classification
+        inputs:
+          - name: data
+            type: INPUT
+            shape: 1,3,224,224
+
+    datasets:
+      - name: imagenet_1000_classes
+        reader: pillow_imread
+
+        # In order to be used by the model, images must be:
+        # 1) Resized to 256x256 with bilinear interpolation
+        # 2) Center-cropped to 224x224
+        # 3) Normalized by 255
+        # 4) Normalized by (0.229, 0.224, 0.225) with mean values (0.485, 0.456, 0.406)
+        preprocessing:
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+            use_pillow: true
+            interpolation: BILINEAR
+
+          - type: crop
+            size: 224
+            use_pillow: true
+
+          - type: normalization
+            std: 255
+
+          - type: normalization
+            mean: (0.485, 0.456, 0.406)
+            std: (0.229, 0.224, 0.225)
+
+            # Reference metric from PyTorch (pytorch v1.3.1, torchvision v0.4.2) top-1 69.76% top-5 89.08%
+
+  - name: resnet-18
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/resnet-18-pytorch/FP32/resnet-18-pytorch.xml
+        weights: public/resnet-18-pytorch/FP32/resnet-18-pytorch.bin
+        adapter: classification
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/resnet-18-pytorch/FP16/resnet-18-pytorch.xml
+        weights: public/resnet-18-pytorch/FP16/resnet-18-pytorch.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        reader: pillow_imread
+
+        # Image channels must be swapped, because "pillow_imread" reads in RGB, but the converted model expects BGR
+        preprocessing:
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+            use_pillow: True
+            interpolation: BILINEAR
+          - type: crop
+            size: 224
+            use_pillow: True
+          - type: bgr_to_rgb
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/resnet-50-caffe2.yml b/tools/accuracy_checker/configs/resnet-50-caffe2.yml
new file mode 100644
index 00000000000..c907f36670d
--- /dev/null
+++ b/tools/accuracy_checker/configs/resnet-50-caffe2.yml
@@ -0,0 +1,46 @@
+models:
+
+  - name: resnet-50-caffe2
+    launchers:
+      - framework: onnx_runtime
+        model: public/resnet-50-caffe2/resnet-50-caffe2.onnx
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+          - type: crop
+            size: 224
+          - type: normalization
+            mean: 103.53, 116.28, 123.675
+            std: 57.375, 57.12, 58.395
+
+  - name: resnet-50-caffe2
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/resnet-50-caffe2/FP32/resnet-50-caffe2.xml
+        weights: public/resnet-50-caffe2/FP32/resnet-50-caffe2.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/resnet-50-caffe2/FP16/resnet-50-caffe2.xml
+        weights: public/resnet-50-caffe2/FP16/resnet-50-caffe2.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+          - type: crop
+            size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/resnet-50-int8-sparse-v1-tf-0001.yml b/tools/accuracy_checker/configs/resnet-50-int8-sparse-v1-tf-0001.yml
deleted file mode 100644
index c6dd2a9e0b1..00000000000
--- a/tools/accuracy_checker/configs/resnet-50-int8-sparse-v1-tf-0001.yml
+++ /dev/null
@@ -1,30 +0,0 @@
-models:
-  - name: resnet-50-int8-sparse-v1-tf-0001
-
-    launchers:
-      - framework: dlsdk
-        tags:
-          - INT8
-        model:   intel/resnet-50-int8-sparse-v1-tf-0001/FP32/resnet-50-int8-sparse-v1-tf-0001.xml
-        weights: intel/resnet-50-int8-sparse-v1-tf-0001/FP32/resnet-50-int8-sparse-v1-tf-0001.bin
-        adapter: classification
-        cpu_extensions: AUTO
-
-
-    datasets:
-      - name: imagenet_1000_classes
-
-        preprocessing:
-        - type: resize
-          size: 256
-          aspect_ratio_scale: greater
-        - type: crop
-          size: 224
-
-        metrics:
-          - name: accuracy@top1
-            type: accuracy
-            top_k: 1
-          - name: accuracy@top5
-            type: accuracy
-            top_k: 5
diff --git a/tools/accuracy_checker/configs/resnet-50-int8-sparse-v2-tf-0001.yml b/tools/accuracy_checker/configs/resnet-50-int8-sparse-v2-tf-0001.yml
deleted file mode 100644
index d7979ab8a24..00000000000
--- a/tools/accuracy_checker/configs/resnet-50-int8-sparse-v2-tf-0001.yml
+++ /dev/null
@@ -1,30 +0,0 @@
-models:
-  - name: resnet-50-int8-sparse-v2-tf-0001
-
-    launchers:
-      - framework: dlsdk
-        tags:
-          - INT8
-        model:   intel/resnet-50-int8-sparse-v2-tf-0001/FP32/resnet-50-int8-sparse-v2-tf-0001.xml
-        weights: intel/resnet-50-int8-sparse-v2-tf-0001/FP32/resnet-50-int8-sparse-v2-tf-0001.bin
-        adapter: classification
-        cpu_extensions: AUTO
-
-
-    datasets:
-      - name: imagenet_1000_classes
-
-        preprocessing:
-        - type: resize
-          size: 256
-          aspect_ratio_scale: greater
-        - type: crop
-          size: 224
-
-        metrics:
-          - name: accuracy@top1
-            type: accuracy
-            top_k: 1
-          - name: accuracy@top5
-            type: accuracy
-            top_k: 5
diff --git a/tools/accuracy_checker/configs/resnet-50-int8-tf-0001.yml b/tools/accuracy_checker/configs/resnet-50-int8-tf-0001.yml
deleted file mode 100644
index deaf6346e29..00000000000
--- a/tools/accuracy_checker/configs/resnet-50-int8-tf-0001.yml
+++ /dev/null
@@ -1,30 +0,0 @@
-models:
-  - name: resnet-50-int8-tf-0001
-
-    launchers:
-      - framework: dlsdk
-        tags:
-          - INT8
-        model:   intel/resnet-50-int8-tf-0001/FP32/resnet-50-int8-tf-0001.xml
-        weights: intel/resnet-50-int8-tf-0001/FP32/resnet-50-int8-tf-0001.bin
-        adapter: classification
-        cpu_extensions: AUTO
-
-
-    datasets:
-      - name: imagenet_1000_classes
-
-        preprocessing:
-        - type: resize
-          size: 256
-          aspect_ratio_scale: greater
-        - type: crop
-          size: 224
-
-        metrics:
-          - name: accuracy@top1
-            type: accuracy
-            top_k: 1
-          - name: accuracy@top5
-            type: accuracy
-            top_k: 5
diff --git a/tools/accuracy_checker/configs/resnet-50-pytorch.yml b/tools/accuracy_checker/configs/resnet-50-pytorch.yml
index 0fac50c8e0e..113045274dd 100644
--- a/tools/accuracy_checker/configs/resnet-50-pytorch.yml
+++ b/tools/accuracy_checker/configs/resnet-50-pytorch.yml
@@ -15,7 +15,7 @@ models:
         reader: pillow_imread
 
         # In order to be used by model, images must be:
-        # 1) Resized to 256x256 with bilinear interpolation 
+        # 1) Resized to 256x256 with bilinear interpolation
         # 2) Cropped central part 224x224
         # 3) Normalized by 255
         # 4) Normalized by (0.229, 0.224, 0.225) with mean values (0.485, 0.456, 0.406)
@@ -25,7 +25,7 @@ models:
             aspect_ratio_scale: greater
             use_pillow: true
             interpolation: BILINEAR
-          
+
           - type: crop
             size: 224
             use_pillow: true
@@ -34,14 +34,13 @@ models:
             std: 255
 
           - type: normalization
-            mean: (0.485, 0.456, 0.406) 
+            mean: (0.485, 0.456, 0.406)
             std: (0.229, 0.224, 0.225)
 
-        # Reference metric from PyTorch (pytorch v1.0.1, torchvision v0.2.2) top-1 76.13% top-5 92.862%
+            # Reference metric from PyTorch (pytorch v1.0.1, torchvision v0.2.2) top-1 76.13% top-5 92.862%
 
   - name: resnet-50-pytorch
 
-    launchers:
     launchers:
       - framework: dlsdk
         tags:
@@ -49,7 +48,7 @@ models:
         model:   public/resnet-50-pytorch/FP32/resnet-50-pytorch.xml
         weights: public/resnet-50-pytorch/FP32/resnet-50-pytorch.bin
         adapter: classification
-      
+
       - framework: dlsdk
         tags:
           - FP16
@@ -73,4 +72,6 @@ models:
           - type: crop
             size: 224
             use_pillow: True
-        # Reference metric from PyTorch (pytorch v1.0.1, torchvision v0.2.2) top-1 76.13% top-5 92.862%
+            # Reference metric from PyTorch (pytorch v1.0.1, torchvision v0.2.2) top-1 76.13% top-5 92.862%
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/resnet-50-tf.yml b/tools/accuracy_checker/configs/resnet-50-tf.yml
new file mode 100644
index 00000000000..e94c6b90952
--- /dev/null
+++ b/tools/accuracy_checker/configs/resnet-50-tf.yml
@@ -0,0 +1,49 @@
+models:
+  - name: resnet-50-tf
+    launchers:
+      - framework: tf
+        model: public/resnet-50-tf/resnet_v1-50.pb
+        adapter: classification
+        inputs:
+          - name: map/TensorArrayStack/TensorArrayGatherV3
+            type: INPUT
+
+    datasets:
+      - name: imagenet_1001_classes
+        preprocessing:
+          - type: bgr_to_rgb
+          - type: normalization
+            mean: [123.68, 116.78, 103.94]
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+          - type: crop
+            size: 224
+
+
+  - name: resnet-50-tf
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/resnet-50-tf/FP32/resnet-50-tf.xml
+        weights: public/resnet-50-tf/FP32/resnet-50-tf.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/resnet-50-tf/FP16/resnet-50-tf.xml
+        weights: public/resnet-50-tf/FP16/resnet-50-tf.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1001_classes
+        preprocessing:
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+          - type: crop
+            size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/resnet-50.yml b/tools/accuracy_checker/configs/resnet-50.yml
index f37723fab68..de661649a12 100644
--- a/tools/accuracy_checker/configs/resnet-50.yml
+++ b/tools/accuracy_checker/configs/resnet-50.yml
@@ -40,3 +40,5 @@ models:
             aspect_ratio_scale: greater
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/resnet18-xnor-binary-onnx-0001.yml b/tools/accuracy_checker/configs/resnet18-xnor-binary-onnx-0001.yml
new file mode 100644
index 00000000000..207bbdd9c77
--- /dev/null
+++ b/tools/accuracy_checker/configs/resnet18-xnor-binary-onnx-0001.yml
@@ -0,0 +1,43 @@
+models:
+  - name: resnet18-xnor-binary-onnx-0001
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32-INT1
+        model:   resnet18-xnor-binary-onnx-0001/FP32-INT1/resnet18-xnor-binary-onnx-0001.xml
+        weights: resnet18-xnor-binary-onnx-0001/FP32-INT1/resnet18-xnor-binary-onnx-0001.bin
+        adapter: classification
+      - framework: dlsdk
+        tags:
+          - FP16-INT1
+        model:   resnet18-xnor-binary-onnx-0001/FP16-INT1/resnet18-xnor-binary-onnx-0001.xml
+        weights: resnet18-xnor-binary-onnx-0001/FP16-INT1/resnet18-xnor-binary-onnx-0001.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        data_source: ImageNet
+        annotation: imagenet1000.pickle
+        reader: pillow_imread
+
+        preprocessing:
+        - type: resize
+          size: 256
+          aspect_ratio_scale: greater
+          use_pillow: True
+          interpolation: BILINEAR
+        - type: crop
+          size: 224
+          use_pillow: True
+        - type: bgr_to_rgb
+
+        metrics:
+          - name: accuracy@top1
+            type: accuracy
+            top_k: 1
+          - name: accuracy@top5
+            type: accuracy
+            top_k: 5
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/resnet50-binary-0001.yml b/tools/accuracy_checker/configs/resnet50-binary-0001.yml
index fa319864441..e16f20d6e0e 100644
--- a/tools/accuracy_checker/configs/resnet50-binary-0001.yml
+++ b/tools/accuracy_checker/configs/resnet50-binary-0001.yml
@@ -4,27 +4,32 @@ models:
     launchers:
       - framework: dlsdk
         tags:
-          - INT1
-        device: CPU
-        model:   intel/resnet50-binary-0001/INT1/resnet50-binary-0001.xml
-        weights: intel/resnet50-binary-0001/INT1/resnet50-binary-0001.bin
+          - FP32-INT1
+        model:   intel/resnet50-binary-0001/FP32-INT1/resnet50-binary-0001.xml
+        weights: intel/resnet50-binary-0001/FP32-INT1/resnet50-binary-0001.bin
         adapter: classification
 
+      - framework: dlsdk
+        tags:
+          - FP16-INT1
+        model:   intel/resnet50-binary-0001/FP16-INT1/resnet50-binary-0001.xml
+        weights: intel/resnet50-binary-0001/FP16-INT1/resnet50-binary-0001.bin
+        adapter: classification
 
     datasets:
       - name: imagenet_1000_classes
         reader: pillow_imread
 
         preprocessing:
-        - type: resize
-          size: 256
-          aspect_ratio_scale: greater
-          use_pillow: True
-          interpolation: BILINEAR
-        - type: crop
-          size: 224
-          use_pillow: True
-        - type: bgr_to_rgb
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+            use_pillow: True
+            interpolation: BILINEAR
+          - type: crop
+            size: 224
+            use_pillow: True
+          - type: bgr_to_rgb
 
         metrics:
           - name: accuracy@top1
@@ -33,3 +38,5 @@ models:
           - name: accuracy@top5
             type: accuracy
             top_k: 5
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/rfcn-resnet101-coco-tf.yml b/tools/accuracy_checker/configs/rfcn-resnet101-coco-tf.yml
new file mode 100644
index 00000000000..c508ad585cb
--- /dev/null
+++ b/tools/accuracy_checker/configs/rfcn-resnet101-coco-tf.yml
@@ -0,0 +1,48 @@
+models:
+  - name:  rfcn-resnet101-coco-tf
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/rfcn-resnet101-coco-tf/FP32/rfcn-resnet101-coco-tf.xml
+        weights: public/rfcn-resnet101-coco-tf/FP32/rfcn-resnet101-coco-tf.bin
+        adapter: ssd
+        inputs:
+          - name: image_info
+            type: CONST_INPUT
+            value: [[600, 600, 1]]
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/rfcn-resnet101-coco-tf/FP16/rfcn-resnet101-coco-tf.xml
+        weights: public/rfcn-resnet101-coco-tf/FP16/rfcn-resnet101-coco-tf.bin
+        adapter: ssd
+        inputs:
+          - name: image_info
+            type: CONST_INPUT
+            value: [[600, 600, 1]]
+
+    datasets:
+      - name: ms_coco_detection_91_classes
+
+        preprocessing:
+            -   type: resize
+                aspect_ratio_scale: fit_to_window
+                dst_height: 600
+                dst_width: 600
+            -   type: padding
+                dst_height: 600
+                dst_width: 600
+                pad_type: right_bottom
+
+        postprocessing:
+            -   type: faster_rcnn_postprocessing_resize
+                dst_height: 600
+                dst_width: 600
+
+        metrics:
+          - type: coco_precision
+            max_detections: 100
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/road-segmentation-adas-0001.yml b/tools/accuracy_checker/configs/road-segmentation-adas-0001.yml
new file mode 100644
index 00000000000..45fa8c8b8e1
--- /dev/null
+++ b/tools/accuracy_checker/configs/road-segmentation-adas-0001.yml
@@ -0,0 +1,35 @@
+models:
+  - name: road-segmentation-adas-0001
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/road-segmentation-adas-0001/FP32/road-segmentation-adas-0001.xml
+        weights: intel/road-segmentation-adas-0001/FP32/road-segmentation-adas-0001.bin
+        adapter: segmentation
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/road-segmentation-adas-0001/FP16/road-segmentation-adas-0001.xml
+        weights: intel/road-segmentation-adas-0001/FP16/road-segmentation-adas-0001.bin
+        adapter: segmentation
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/road-segmentation-adas-0001/FP32-INT8/road-segmentation-adas-0001.xml
+        weights: intel/road-segmentation-adas-0001/FP32-INT8/road-segmentation-adas-0001.bin
+        adapter: segmentation
+
+    datasets:
+      - name: road_segmentation
+        metrics:
+          - type: mean_iou
+            presenter: print_vector
+          - type: mean_accuracy
+            presenter: print_vector
+
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/se-inception.yml b/tools/accuracy_checker/configs/se-inception.yml
index 4fd25c0dcac..dc05badaa1c 100644
--- a/tools/accuracy_checker/configs/se-inception.yml
+++ b/tools/accuracy_checker/configs/se-inception.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/se-resnet-101.yml b/tools/accuracy_checker/configs/se-resnet-101.yml
index 6e7dd6a0373..1a9084135bf 100644
--- a/tools/accuracy_checker/configs/se-resnet-101.yml
+++ b/tools/accuracy_checker/configs/se-resnet-101.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/se-resnet-152.yml b/tools/accuracy_checker/configs/se-resnet-152.yml
index d02eb4ffc83..68dac2d02c9 100644
--- a/tools/accuracy_checker/configs/se-resnet-152.yml
+++ b/tools/accuracy_checker/configs/se-resnet-152.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/se-resnet-50.yml b/tools/accuracy_checker/configs/se-resnet-50.yml
index 766f65059de..44d17e18077 100644
--- a/tools/accuracy_checker/configs/se-resnet-50.yml
+++ b/tools/accuracy_checker/configs/se-resnet-50.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/se-resnext-101.yml b/tools/accuracy_checker/configs/se-resnext-101.yml
index 12cea5add9a..673e61c87b3 100644
--- a/tools/accuracy_checker/configs/se-resnext-101.yml
+++ b/tools/accuracy_checker/configs/se-resnext-101.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/se-resnext-50.yml b/tools/accuracy_checker/configs/se-resnext-50.yml
index d968c3824c2..0419c98889f 100644
--- a/tools/accuracy_checker/configs/se-resnext-50.yml
+++ b/tools/accuracy_checker/configs/se-resnext-50.yml
@@ -39,3 +39,5 @@ models:
             size: 256
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/semantic-segmentation-adas-0001.yml b/tools/accuracy_checker/configs/semantic-segmentation-adas-0001.yml
new file mode 100644
index 00000000000..409ab0e9eb2
--- /dev/null
+++ b/tools/accuracy_checker/configs/semantic-segmentation-adas-0001.yml
@@ -0,0 +1,46 @@
+models:
+  - name: semantic-segmentation-adas-0001
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/semantic-segmentation-adas-0001/FP32/semantic-segmentation-adas-0001.xml
+        weights: intel/semantic-segmentation-adas-0001/FP32/semantic-segmentation-adas-0001.bin
+        adapter: segmentation
+        inputs:
+          - name: data
+            type: INPUT
+            precision: U8
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/semantic-segmentation-adas-0001/FP16/semantic-segmentation-adas-0001.xml
+        weights: intel/semantic-segmentation-adas-0001/FP16/semantic-segmentation-adas-0001.bin
+        adapter: segmentation
+        inputs:
+          - name: data
+            type: INPUT
+            precision: U8
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/semantic-segmentation-adas-0001/FP32-INT8/semantic-segmentation-adas-0001.xml
+        weights: intel/semantic-segmentation-adas-0001/FP32-INT8/semantic-segmentation-adas-0001.bin
+        adapter: segmentation
+        inputs:
+          - name: data
+            type: INPUT
+            precision: U8
+
+    datasets:
+      - name: semantic_segmentation_adas
+
+        metrics:
+          - type: mean_iou
+            use_argmax: False
+            presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/single-human-pose-estimation-0001.yml b/tools/accuracy_checker/configs/single-human-pose-estimation-0001.yml
new file mode 100644
index 00000000000..f7211683b88
--- /dev/null
+++ b/tools/accuracy_checker/configs/single-human-pose-estimation-0001.yml
@@ -0,0 +1,31 @@
+models:
+  - name: single-human-pose-estimation-0001
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/single-human-pose-estimation-0001/FP32/single-human-pose-estimation-0001.xml
+        weights: public/single-human-pose-estimation-0001/FP32/single-human-pose-estimation-0001.bin
+        adapter:
+          type: single_human_pose_estimation
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/single-human-pose-estimation-0001/FP16/single-human-pose-estimation-0001.xml
+        weights: public/single-human-pose-estimation-0001/FP16/single-human-pose-estimation-0001.bin
+        adapter:
+          type: single_human_pose_estimation
+
+    datasets:
+      - name: ms_coco_single_keypoints
+        preprocessing:
+          - type: transformed_crop_with_auto_scale
+            dst_height: 384
+            dst_width: 288
+            stride: 8
+        metrics:
+          - name: AP
+            type: coco_orig_keypoints_precision
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/single-image-super-resolution-1032.yml b/tools/accuracy_checker/configs/single-image-super-resolution-1032.yml
new file mode 100644
index 00000000000..120b829734c
--- /dev/null
+++ b/tools/accuracy_checker/configs/single-image-super-resolution-1032.yml
@@ -0,0 +1,56 @@
+models:
+  - name: single-image-super-resolution-1032
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/single-image-super-resolution-1032/FP32/single-image-super-resolution-1032.xml
+        weights: intel/single-image-super-resolution-1032/FP32/single-image-super-resolution-1032.bin
+        adapter:
+          type: super_resolution
+          reverse_channels: True
+        inputs:
+          - name: "0"
+            type: INPUT
+            value: ".*lr_x4*.png"
+          - name: "1"
+            type: INPUT
+            value: ".*upsample_x4*.png"
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/single-image-super-resolution-1032/FP16/single-image-super-resolution-1032.xml
+        weights: intel/single-image-super-resolution-1032/FP16/single-image-super-resolution-1032.bin
+        adapter:
+          type: super_resolution
+          reverse_channels: True
+        inputs:
+          - name: "0"
+            type: INPUT
+            value: ".*lr_x4*.png"
+          - name: "1"
+            type: INPUT
+            value: ".*upsample_x4*.png"
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/single-image-super-resolution-1032/FP32-INT8/single-image-super-resolution-1032.xml
+        weights: intel/single-image-super-resolution-1032/FP32-INT8/single-image-super-resolution-1032.bin
+        adapter:
+          type: super_resolution
+          reverse_channels: True
+        inputs:
+          - name: "0"
+            type: INPUT
+            value: ".*lr_x4*.png"
+          - name: "1"
+            type: INPUT
+            value: ".*upsample_x4*.png"
+
+    datasets:
+      - name: super_resolution_x4
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/single-image-super-resolution-1033.yml b/tools/accuracy_checker/configs/single-image-super-resolution-1033.yml
new file mode 100644
index 00000000000..516005e1257
--- /dev/null
+++ b/tools/accuracy_checker/configs/single-image-super-resolution-1033.yml
@@ -0,0 +1,61 @@
+models:
+  - name: single-image-super-resolution-1033
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/single-image-super-resolution-1033/FP32/single-image-super-resolution-1033.xml
+        weights: intel/single-image-super-resolution-1033/FP32/single-image-super-resolution-1033.bin
+        adapter:
+          type: super_resolution
+          reverse_channels: True
+        inputs:
+          - name: "0"
+            type: INPUT
+            value: ".*lr_x3*.png"
+          - name: "1"
+            type: INPUT
+            value: ".*upsample_x3*.png"
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/single-image-super-resolution-1033/FP16/single-image-super-resolution-1033.xml
+        weights: intel/single-image-super-resolution-1033/FP16/single-image-super-resolution-1033.bin
+        adapter:
+          type: super_resolution
+          reverse_channels: True
+        inputs:
+          - name: "0"
+            type: INPUT
+            value: ".*lr_x3*.png"
+          - name: "1"
+            type: INPUT
+            value: ".*upsample_x3*.png"
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/single-image-super-resolution-1033/FP32-INT8/single-image-super-resolution-1033.xml
+        weights: intel/single-image-super-resolution-1033/FP32-INT8/single-image-super-resolution-1033.bin
+        adapter:
+          type: super_resolution
+          reverse_channels: True
+        inputs:
+          - name: "0"
+            type: INPUT
+            value: ".*lr_x3*.png"
+          - name: "1"
+            type: INPUT
+            value: ".*upsample_x3*.png"
+
+    datasets:
+      - name: super_resolution_x3
+
+        metrics:
+          - type: psnr
+            scale_border: 4
+            presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/squeezenet1.0.yml b/tools/accuracy_checker/configs/squeezenet1.0.yml
index 9450d8b7c38..aa9a43d497d 100644
--- a/tools/accuracy_checker/configs/squeezenet1.0.yml
+++ b/tools/accuracy_checker/configs/squeezenet1.0.yml
@@ -38,3 +38,5 @@ models:
             size: 256
           - type: crop
             size: 227
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/squeezenet1.1-caffe2.yml b/tools/accuracy_checker/configs/squeezenet1.1-caffe2.yml
new file mode 100644
index 00000000000..404d81d2dd5
--- /dev/null
+++ b/tools/accuracy_checker/configs/squeezenet1.1-caffe2.yml
@@ -0,0 +1,44 @@
+models:
+  - name: squeezenet1.1-caffe2
+
+    launchers:
+      - framework: onnx_runtime
+        model: public/squeezenet1.1-caffe2/squeezenet1.1-caffe2.onnx
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: resize
+            size: 256
+          - type: crop
+            size: 227
+          - type: normalization
+            mean: 103.96,116.78,123.68
+
+  - name: squeezenet1.1-caffe2
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/squeezenet1.1-caffe2/FP32/squeezenet1.1-caffe2.xml
+        weights: public/squeezenet1.1-caffe2/FP32/squeezenet1.1-caffe2.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/squeezenet1.1-caffe2/FP16/squeezenet1.1-caffe2.xml
+        weights: public/squeezenet1.1-caffe2/FP16/squeezenet1.1-caffe2.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+          - type: crop
+            size: 227
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/squeezenet1.1.yml b/tools/accuracy_checker/configs/squeezenet1.1.yml
index 8de59f46113..8e54e9aae2e 100644
--- a/tools/accuracy_checker/configs/squeezenet1.1.yml
+++ b/tools/accuracy_checker/configs/squeezenet1.1.yml
@@ -38,3 +38,5 @@ models:
             size: 256
           - type: crop
             size: 227
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/ssd300.yml b/tools/accuracy_checker/configs/ssd300.yml
index f53e94ec0d5..7b42d50844c 100644
--- a/tools/accuracy_checker/configs/ssd300.yml
+++ b/tools/accuracy_checker/configs/ssd300.yml
@@ -23,7 +23,6 @@ models:
         model:   public/ssd300/FP32/ssd300.xml
         weights: public/ssd300/FP32/ssd300.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -31,7 +30,6 @@ models:
         model:   public/ssd300/FP16/ssd300.xml
         weights: public/ssd300/FP16/ssd300.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
     datasets:
       - name: VOC2012
@@ -40,3 +38,5 @@ models:
             size: 300
         postprocessing:
           - type: resize_prediction_boxes
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/ssd512.yml b/tools/accuracy_checker/configs/ssd512.yml
index 39190060f8f..eb709a903a4 100644
--- a/tools/accuracy_checker/configs/ssd512.yml
+++ b/tools/accuracy_checker/configs/ssd512.yml
@@ -23,7 +23,6 @@ models:
         model:   public/ssd512/FP32/ssd512.xml
         weights: public/ssd512/FP32/ssd512.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -31,7 +30,6 @@ models:
         model:   public/ssd512/FP16/ssd512.xml
         weights: public/ssd512/FP16/ssd512.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
     datasets:
       - name: VOC2012
@@ -40,3 +38,5 @@ models:
             size: 512
         postprocessing:
           - type: resize_prediction_boxes
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/ssd_mobilenet_v1_coco.yml b/tools/accuracy_checker/configs/ssd_mobilenet_v1_coco.yml
index 306ed2f471b..50176a66d5e 100644
--- a/tools/accuracy_checker/configs/ssd_mobilenet_v1_coco.yml
+++ b/tools/accuracy_checker/configs/ssd_mobilenet_v1_coco.yml
@@ -24,3 +24,5 @@ models:
           - type: resize_prediction_boxes
         metrics:
           - type: coco_precision
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/ssd_mobilenet_v1_fpn_coco.yml b/tools/accuracy_checker/configs/ssd_mobilenet_v1_fpn_coco.yml
index 6b7f5e3ce5e..0b1bcdac5ce 100644
--- a/tools/accuracy_checker/configs/ssd_mobilenet_v1_fpn_coco.yml
+++ b/tools/accuracy_checker/configs/ssd_mobilenet_v1_fpn_coco.yml
@@ -24,3 +24,5 @@ models:
           - type: resize_prediction_boxes
         metrics:
           - type: coco_precision
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/ssd_mobilenet_v2_coco.yml b/tools/accuracy_checker/configs/ssd_mobilenet_v2_coco.yml
index efe661303a6..4265ab76b62 100644
--- a/tools/accuracy_checker/configs/ssd_mobilenet_v2_coco.yml
+++ b/tools/accuracy_checker/configs/ssd_mobilenet_v2_coco.yml
@@ -24,3 +24,5 @@ models:
           - type: resize_prediction_boxes
         metrics:
           - type: coco_precision
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/ssdlite_mobilenet_v2.yml b/tools/accuracy_checker/configs/ssdlite_mobilenet_v2.yml
index b9364884565..49e6ad09610 100644
--- a/tools/accuracy_checker/configs/ssdlite_mobilenet_v2.yml
+++ b/tools/accuracy_checker/configs/ssdlite_mobilenet_v2.yml
@@ -24,3 +24,5 @@ models:
           - type: resize_prediction_boxes
         metrics:
           - type: coco_precision
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/text-detection-0003.yml b/tools/accuracy_checker/configs/text-detection-0003.yml
index 00e7bc56a55..215d932f1f9 100644
--- a/tools/accuracy_checker/configs/text-detection-0003.yml
+++ b/tools/accuracy_checker/configs/text-detection-0003.yml
@@ -22,7 +22,7 @@ models:
         model:   intel/text-detection-0003/FP16/text-detection-0003.xml
         weights: intel/text-detection-0003/FP16/text-detection-0003.bin
         adapter:
-          type: text_detection
+          type: pixel_link_text_detection
           pixel_link_out: model/link_logits_/add
           pixel_class_out: model/segm_logits/add
           pixel_class_confidence_threshold: 0.8
@@ -32,12 +32,12 @@ models:
 
       - framework: dlsdk
         tags:
-          - INT8
+          - FP32-INT8
         device: CPU
-        model:   intel/text-detection-0003/INT8/text-detection-0003.xml
-        weights: intel/text-detection-0003/INT8/text-detection-0003.bin
+        model:   intel/text-detection-0003/FP32-INT8/text-detection-0003.xml
+        weights: intel/text-detection-0003/FP32-INT8/text-detection-0003.bin
         adapter:
-          type: text_detection
+          type: pixel_link_text_detection
           pixel_link_out: model/link_logits_/add
           pixel_class_out: model/segm_logits/add
           pixel_class_confidence_threshold: 0.8
@@ -48,11 +48,6 @@ models:
     datasets:
       - name: ICDAR2015
 
-        data_source: ICDAR15_DET_validation/ch4_test_images
-        annotation_conversion:
-          converter: icdar_detection
-          data_dir: ICDAR15_DET_validation/gt
-
         preprocessing:
           - type: resize
             dst_width: 1280
@@ -73,3 +68,5 @@ models:
           - type: incidental_text_hmean
             name: f-measure
             ignore_difficult: True
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/text-detection-0004.yml b/tools/accuracy_checker/configs/text-detection-0004.yml
index a0a8686bf2a..b1ef29f2fee 100644
--- a/tools/accuracy_checker/configs/text-detection-0004.yml
+++ b/tools/accuracy_checker/configs/text-detection-0004.yml
@@ -15,13 +15,12 @@ models:
           pixel_link_confidence_threshold: 0.8
           min_area: 300
           min_height: 10
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
           - FP16
         model:   intel/text-detection-0004/FP16/text-detection-0004.xml
-        weights: intel/text-detection-0004/dldt/FP16/text-detection-0004.bin
+        weights: intel/text-detection-0004/FP16/text-detection-0004.bin
         adapter:
           type: pixel_link_text_detection
           pixel_link_out: model/link_logits_/add
@@ -30,14 +29,12 @@ models:
           pixel_link_confidence_threshold: 0.8
           min_area: 300
           min_height: 10
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
-          - INT8
-        device: CPU
-        model:   intel/text-detection-0004/INT8/text-detection-0004.xml
-        weights: intel/text-detection-0004/INT8/text-detection-0004.bin
+          - FP32-INT8
+        model:   intel/text-detection-0004/FP32-INT8/text-detection-0004.xml
+        weights: intel/text-detection-0004/FP32-INT8/text-detection-0004.bin
         adapter:
           type: pixel_link_text_detection
           pixel_link_out: model/link_logits_/add
@@ -50,11 +47,6 @@ models:
     datasets:
       - name: ICDAR2015
 
-        data_source: ICDAR15_DET_validation/ch4_test_images
-        annotation_conversion:
-          converter: icdar_detection
-          data_dir: ICDAR15_DET_validation/gt
-
         preprocessing:
           - type: resize
             dst_width: 1280
@@ -75,3 +67,5 @@ models:
           - type: incidental_text_hmean
             name: f-measure
             ignore_difficult: True
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/text-image-super-resolution-0001.yml b/tools/accuracy_checker/configs/text-image-super-resolution-0001.yml
new file mode 100644
index 00000000000..348a6434446
--- /dev/null
+++ b/tools/accuracy_checker/configs/text-image-super-resolution-0001.yml
@@ -0,0 +1,32 @@
+models:
+  - name: text-image-super-resolution-0001
+
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   intel/text-image-super-resolution-0001/FP32/text-image-super-resolution-0001.xml
+        weights: intel/text-image-super-resolution-0001/FP32/text-image-super-resolution-0001.bin
+        adapter:
+          type: super_resolution
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   intel/text-image-super-resolution-0001/FP16/text-image-super-resolution-0001.xml
+        weights: intel/text-image-super-resolution-0001/FP16/text-image-super-resolution-0001.bin
+        adapter:
+          type: super_resolution
+
+      - framework: dlsdk
+        tags:
+          - FP32-INT8
+        model:   intel/text-image-super-resolution-0001/FP32-INT8/text-image-super-resolution-0001.xml
+        weights: intel/text-image-super-resolution-0001/FP32-INT8/text-image-super-resolution-0001.bin
+        adapter:
+          type: super_resolution
+
+    datasets:
+      - name: text_super_resolution_x3
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/text-recognition-0012.yml b/tools/accuracy_checker/configs/text-recognition-0012.yml
index 6bc5d50ac73..693b946d5da 100644
--- a/tools/accuracy_checker/configs/text-recognition-0012.yml
+++ b/tools/accuracy_checker/configs/text-recognition-0012.yml
@@ -18,18 +18,13 @@ models:
 
       - framework: dlsdk
         tags:
-          - INT8
-        device: CPU
-        model:   intel/text-recognition-0012/INT8/text-recognition-0012.xml
-        weights: intel/text-recognition-0012/INT8/text-recognition-0012.bin
+          - FP32-INT8
+        model:   intel/text-recognition-0012/FP32-INT8/text-recognition-0012.xml
+        weights: intel/text-recognition-0012/FP32-INT8/text-recognition-0012.bin
         adapter: beam_search_decoder
 
     datasets:
       - name: ICDAR2013
-        data_source: ICDAR13_REC_validation/Challenge2_Test_Task3_Images
-        annotation_conversion:
-          converter: icdar13_recognition
-          annotation_file: ICDAR13_REC_validation/gt/gt.txt.fixed.alfanumeric
 
         preprocessing:
           - type: bgr_to_gray
@@ -39,3 +34,5 @@ models:
 
         metrics:
           - type: character_recognition_accuracy
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/text-spotting-0001.yml b/tools/accuracy_checker/configs/text-spotting-0001.yml
new file mode 100644
index 00000000000..0f57727d5a2
--- /dev/null
+++ b/tools/accuracy_checker/configs/text-spotting-0001.yml
@@ -0,0 +1,120 @@
+evaluations:
+  - name: text-spotting-0001
+    module: custom_evaluators.text_spotting_evaluator.TextSpottingEvaluator
+    module_config:
+      network_info:
+        detector:
+          model:   intel/text-spotting-0001-detector/FP32/text-spotting-0001-detector.xml
+          weights: intel/text-spotting-0001-detector/FP32/text-spotting-0001-detector.bin
+
+        recognizer_encoder:
+          model:   intel/text-spotting-0001-recognizer-encoder/FP32/text-spotting-0001-recognizer-encoder.xml
+          weights: intel/text-spotting-0001-recognizer-encoder/FP32/text-spotting-0001-recognizer-encoder.bin
+
+        recognizer_decoder:
+          model:   intel/text-spotting-0001-recognizer-decoder/FP32/text-spotting-0001-recognizer-decoder.xml
+          weights: intel/text-spotting-0001-recognizer-decoder/FP32/text-spotting-0001-recognizer-decoder.bin
+
+        recognizer_decoder_inputs:
+          prev_symbol: prev_symbol
+          prev_hidden: prev_hidden
+          encoder_outputs: encoder_outputs
+
+        recognizer_decoder_outputs:
+          symbols_distribution: output
+          cur_hidden: hidden
+
+        max_seq_len: '28'
+
+        alphabet: __0123456789abcdefghijklmnopqrstuvwxyz
+        sos_index: '0'
+        eos_index: '1'
+
+        adapter:
+          type: mask_rcnn_with_text
+          classes_out: classes
+          scores_out: scores
+          boxes_out: boxes
+          raw_masks_out: raw_masks
+          texts_out: texts
+          confidence_threshold: 0.8
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP32
+
+      datasets:
+        - name: ICDAR2015_word_spotting
+
+          preprocessing:
+            - type: resize
+              dst_width: 1280
+              dst_height: 768
+
+          metrics:
+            - type: incidental_text_hmean
+              name: f-measure
+              ignore_difficult: True
+              word_spotting: True
+
+  - name: text-spotting-0001
+    module: custom_evaluators.text_spotting_evaluator.TextSpottingEvaluator
+    module_config:
+      network_info:
+        detector:
+          model:   intel/text-spotting-0001-detector/FP16/text-spotting-0001-detector.xml
+          weights: intel/text-spotting-0001-detector/FP16/text-spotting-0001-detector.bin
+
+        recognizer_encoder:
+          model:   intel/text-spotting-0001-recognizer-encoder/FP16/text-spotting-0001-recognizer-encoder.xml
+          weights: intel/text-spotting-0001-recognizer-encoder/FP16/text-spotting-0001-recognizer-encoder.bin
+
+        recognizer_decoder:
+          model:   intel/text-spotting-0001-recognizer-decoder/FP16/text-spotting-0001-recognizer-decoder.xml
+          weights: intel/text-spotting-0001-recognizer-decoder/FP16/text-spotting-0001-recognizer-decoder.bin
+
+        recognizer_decoder_inputs:
+          prev_symbol: prev_symbol
+          prev_hidden: prev_hidden
+          encoder_outputs: encoder_outputs
+
+        recognizer_decoder_outputs:
+          symbols_distribution: output
+          cur_hidden: hidden
+
+        max_seq_len: '28'
+
+        alphabet: __0123456789abcdefghijklmnopqrstuvwxyz
+        sos_index: '0'
+        eos_index: '1'
+
+        adapter:
+          type: mask_rcnn_with_text
+          classes_out: classes
+          scores_out: scores
+          boxes_out: boxes
+          raw_masks_out: raw_masks
+          texts_out: texts
+          confidence_threshold: 0.8
+
+      launchers:
+        - framework: dlsdk
+          tags:
+            - FP16
+
+      datasets:
+        - name: ICDAR2015_word_spotting
+
+          preprocessing:
+            - type: resize
+              dst_width: 1280
+              dst_height: 768
+
+          metrics:
+            - type: incidental_text_hmean
+              name: f-measure
+              ignore_difficult: True
+              word_spotting: True
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/vehicle-attributes-recognition-barrier-0039.yml b/tools/accuracy_checker/configs/vehicle-attributes-recognition-barrier-0039.yml
index 71ca136a06f..75d0fd382e4 100644
--- a/tools/accuracy_checker/configs/vehicle-attributes-recognition-barrier-0039.yml
+++ b/tools/accuracy_checker/configs/vehicle-attributes-recognition-barrier-0039.yml
@@ -24,9 +24,9 @@ models:
 
       - framework: dlsdk
         tags:
-          - INT8
-        model:   intel/vehicle-attributes-recognition-barrier-0039/INT8/vehicle-attributes-recognition-barrier-0039.xml
-        weights: intel/vehicle-attributes-recognition-barrier-0039/INT8/vehicle-attributes-recognition-barrier-0039.bin
+          - FP32-INT8
+        model:   intel/vehicle-attributes-recognition-barrier-0039/FP32-INT8/vehicle-attributes-recognition-barrier-0039.xml
+        weights: intel/vehicle-attributes-recognition-barrier-0039/FP32-INT8/vehicle-attributes-recognition-barrier-0039.bin
         adapter:
           type: vehicle_attributes
           color_out: color
@@ -57,3 +57,5 @@ models:
             annotation_source: type
             prediction_source: type
             label_map: type_label_map
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/vehicle-detection-adas-0002.yml b/tools/accuracy_checker/configs/vehicle-detection-adas-0002.yml
index e18776a06fc..39df2912114 100644
--- a/tools/accuracy_checker/configs/vehicle-detection-adas-0002.yml
+++ b/tools/accuracy_checker/configs/vehicle-detection-adas-0002.yml
@@ -8,7 +8,6 @@ models:
         model:   intel/vehicle-detection-adas-0002/FP32/vehicle-detection-adas-0002.xml
         weights: intel/vehicle-detection-adas-0002/FP32/vehicle-detection-adas-0002.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -16,15 +15,13 @@ models:
         model:   intel/vehicle-detection-adas-0002/FP16/vehicle-detection-adas-0002.xml
         weights: intel/vehicle-detection-adas-0002/FP16/vehicle-detection-adas-0002.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
-          - INT8
-        model:   intel/vehicle-detection-adas-0002/INT8/vehicle-detection-adas-0002.xml
-        weights: intel/vehicle-detection-adas-0002/INT8/vehicle-detection-adas-0002.bin
+          - FP32-INT8
+        model:   intel/vehicle-detection-adas-0002/FP32-INT8/vehicle-detection-adas-0002.xml
+        weights: intel/vehicle-detection-adas-0002/FP32-INT8/vehicle-detection-adas-0002.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
     datasets:
       - name: vehicle_detection_dataset
@@ -49,3 +46,5 @@ models:
             include_boundaries: True
             allow_multiple_matches_per_ignored: True
             use_filtered_tp: True
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/vehicle-detection-adas-binary-0001.yml b/tools/accuracy_checker/configs/vehicle-detection-adas-binary-0001.yml
index b273e01b8c2..a8570d305de 100644
--- a/tools/accuracy_checker/configs/vehicle-detection-adas-binary-0001.yml
+++ b/tools/accuracy_checker/configs/vehicle-detection-adas-binary-0001.yml
@@ -4,11 +4,10 @@ models:
     launchers:
       - framework: dlsdk
         tags:
-          - INT1
-        model:   intel/vehicle-detection-adas-binary-0001/INT1/vehicle-detection-adas-binary-0001.xml
-        weights: intel/vehicle-detection-adas-binary-0001/INT1/vehicle-detection-adas-binary-0001.bin
+          - FP32-INT1
+        model:   intel/vehicle-detection-adas-binary-0001/FP32-INT1/vehicle-detection-adas-binary-0001.xml
+        weights: intel/vehicle-detection-adas-binary-0001/FP32-INT1/vehicle-detection-adas-binary-0001.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
     datasets:
       - name: vehicle_detection_dataset
@@ -33,3 +32,5 @@ models:
             include_boundaries: True
             allow_multiple_matches_per_ignored: True
             use_filtered_tp: True
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/vehicle-license-plate-detection-barrier-0106.yml b/tools/accuracy_checker/configs/vehicle-license-plate-detection-barrier-0106.yml
index 5578d51c47f..2acb7bbe331 100644
--- a/tools/accuracy_checker/configs/vehicle-license-plate-detection-barrier-0106.yml
+++ b/tools/accuracy_checker/configs/vehicle-license-plate-detection-barrier-0106.yml
@@ -8,7 +8,6 @@ models:
         model:   intel/vehicle-license-plate-detection-barrier-0106/FP32/vehicle-license-plate-detection-barrier-0106.xml
         weights: intel/vehicle-license-plate-detection-barrier-0106/FP32/vehicle-license-plate-detection-barrier-0106.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
@@ -16,15 +15,13 @@ models:
         model:   intel/vehicle-license-plate-detection-barrier-0106/FP16/vehicle-license-plate-detection-barrier-0106.xml
         weights: intel/vehicle-license-plate-detection-barrier-0106/FP16/vehicle-license-plate-detection-barrier-0106.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
       - framework: dlsdk
         tags:
-          - INT8
-        model:   intel/vehicle-license-plate-detection-barrier-0106/INT8/vehicle-license-plate-detection-barrier-0106.xml
-        weights: intel/vehicle-license-plate-detection-barrier-0106/INT8/vehicle-license-plate-detection-barrier-0106.bin
+          - FP32-INT8
+        model:   intel/vehicle-license-plate-detection-barrier-0106/FP32-INT8/vehicle-license-plate-detection-barrier-0106.xml
+        weights: intel/vehicle-license-plate-detection-barrier-0106/FP32-INT8/vehicle-license-plate-detection-barrier-0106.bin
         adapter: ssd
-        cpu_extensions: AUTO
 
     datasets:
       - name: vehicle_license_plate_detection
@@ -55,3 +52,5 @@ models:
             allow_multiple_matches_per_ignored: True
             distinct_conf: False
             presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/vehicle-license-plate-detection-barrier-0123.yml b/tools/accuracy_checker/configs/vehicle-license-plate-detection-barrier-0123.yml
new file mode 100644
index 00000000000..94bc2b433c1
--- /dev/null
+++ b/tools/accuracy_checker/configs/vehicle-license-plate-detection-barrier-0123.yml
@@ -0,0 +1,54 @@
+models:
+  - name: vehicle-license-plate-detection-barrier-0123
+
+    launchers:
+      - framework: tf
+        device: CPU
+        model:   public/vehicle-license-plate-detection-barrier-0123/model/model.pb.frozen
+        adapter: ssd
+
+      - framework: dlsdk
+        tags:
+          - FP32
+        model: public/vehicle-license-plate-detection-barrier-0123/FP32/vehicle-license-plate-detection-barrier-0123.xml
+        weights: public/vehicle-license-plate-detection-barrier-0123/FP32/vehicle-license-plate-detection-barrier-0123.bin
+        adapter: ssd
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model: public/vehicle-license-plate-detection-barrier-0123/FP16/vehicle-license-plate-detection-barrier-0123.xml
+        weights: public/vehicle-license-plate-detection-barrier-0123/FP16/vehicle-license-plate-detection-barrier-0123.bin
+        adapter: ssd
+
+    datasets:
+      - name: vehicle_license_plate_detection
+
+        preprocessing:
+          - type: resize
+            dst_width: 256
+            dst_height: 256
+
+        postprocessing:
+          - type: clip_boxes
+            apply_to: prediction
+            dst_width: 1
+            dst_height: 1
+          - type: resize_prediction_boxes
+          - type: filter
+            apply_to: prediction
+            min_confidence: 0.005
+            is_empty: True
+          - type: filter
+            apply_to: annotation
+            area_ratio: 0.034722222222222224
+
+        metrics:
+          - type: map
+            ignore_difficult: True
+            include_boundaries: False
+            allow_multiple_matches_per_ignored: True
+            distinct_conf: False
+            presenter: print_vector
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/vgg16.yml b/tools/accuracy_checker/configs/vgg16.yml
index 7756740941f..21e68355699 100644
--- a/tools/accuracy_checker/configs/vgg16.yml
+++ b/tools/accuracy_checker/configs/vgg16.yml
@@ -40,3 +40,5 @@ models:
             aspect_ratio_scale: greater
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/vgg19-caffe2.yml b/tools/accuracy_checker/configs/vgg19-caffe2.yml
new file mode 100644
index 00000000000..18e4ee2d6a0
--- /dev/null
+++ b/tools/accuracy_checker/configs/vgg19-caffe2.yml
@@ -0,0 +1,45 @@
+models:
+
+  - name: vgg19-caffe2
+    launchers:
+      - framework: onnx_runtime
+        model: public/vgg19-caffe2/vgg19-caffe2.onnx
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+          - type: crop
+            size: 224
+          - type: normalization
+            mean: 103.939, 116.779, 123.68
+
+  - name: vgg19-caffe2
+    launchers:
+      - framework: dlsdk
+        tags:
+          - FP32
+        model:   public/vgg19-caffe2/FP32/vgg19-caffe2.xml
+        weights: public/vgg19-caffe2/FP32/vgg19-caffe2.bin
+        adapter: classification
+
+      - framework: dlsdk
+        tags:
+          - FP16
+        model:   public/vgg19-caffe2/FP16/vgg19-caffe2.xml
+        weights: public/vgg19-caffe2/FP16/vgg19-caffe2.bin
+        adapter: classification
+
+    datasets:
+      - name: imagenet_1000_classes
+        preprocessing:
+          - type: resize
+            size: 256
+            aspect_ratio_scale: greater
+          - type: crop
+            size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/configs/vgg19.yml b/tools/accuracy_checker/configs/vgg19.yml
index 7f9cdd83616..a9bcdacdabb 100644
--- a/tools/accuracy_checker/configs/vgg19.yml
+++ b/tools/accuracy_checker/configs/vgg19.yml
@@ -40,3 +40,5 @@ models:
             aspect_ratio_scale: greater
           - type: crop
             size: 224
+
+global_definitions: ../dataset_definitions.yml
diff --git a/tools/accuracy_checker/custom_evaluators/README.md b/tools/accuracy_checker/custom_evaluators/README.md
new file mode 100644
index 00000000000..4a85a073bab
--- /dev/null
+++ b/tools/accuracy_checker/custom_evaluators/README.md
@@ -0,0 +1,42 @@
+# Custom Evaluators for Accuracy Checker
+Standard Accuracy Checker validation pipeline: Annotation Reading -> Data Reading -> Preprocessing -> Inference -> Postprocessing -> Metrics.
+In some cases this pipeline can be unsuitable (e.g. if you have a sequence of models). You can customize the validation pipeline using your own evaluator.
+The suggested approach is to write a Python module which describes the validation procedure.
+
+## Implementation
+The process of adding a new evaluator is similar to adding any other entity in the tool.
+A custom evaluator is a class which should inherit from `BaseEvaluator` and override all of its abstract methods.
+
+The most important methods to override:
+
+* `from_configs` - create new instance using configuration dictionary.
+* `process_dataset` - determine validation cycle across all data batches in dataset.
+* `compute_metrics` - metrics evaluation after dataset processing.
+* `reset` - reset evaluation progress
+
+## Configuration
+Each custom evaluation config should start with the keyword `evaluations` and contain:
+ * `name` - model name
+ * `module` - evaluation module for loading. 
+Before running, please make sure that the path prefix of the module is added to your Python path, or use the `python_path` parameter in the config to specify it.
+Optionally, you can provide a `module_config` section which contains the config for the custom evaluator (depending on the implementation, it can contain evaluator-specific parameters).
+
+
+## Examples
+* **Sequential Action Recognition Evaluator** demonstrates how to run Action Recognition models with encoder + decoder architecture.
+  [Evaluator code](sequential_action_recognition_evaluator.py)
+  Configuration file examples:
+    * [action-recognition-0001-encoder](../configs/action-recognition-0001-encoder.yml) - running full pipeline of action recognition model.
+    * [action-recognition-0001-decoder](../configs/action-recognition-0001-decoder.yml) - running only decoder stage with dumped embeddings of encoder.
+
+* **MTCNN Evaluator** shows how to run MTCNN model.
+  [Evaluator code](mtcnn_evaluator.py)
+  Configuration file examples:
+    * [mtcnn-p](../configs/mtcnn-p.yml) - running proposal stage of MTCNN as usual model.
+    * [mtcnn-r](../configs/mtcnn-r.yml) - running only refine stage of MTCNN using dumped proposal stage results.
+    * [mtcnn-o](../configs/mtcnn-o.yml) - running full MTCNN pipeline.
+
+* **Text Spotting Evaluator** demonstrates how to evaluate text-spotting-0001 model via Accuracy Checker.
+  [Evaluator code](text_spotting_evaluator.py)
+  Configuration file examples:
+    * [text-spotting-0001](../configs/text-spotting-0001.yml)
diff --git a/tools/accuracy_checker/custom_evaluators/__init__.py b/tools/accuracy_checker/custom_evaluators/__init__.py
new file mode 100644
index 00000000000..7c9fcf6dc14
--- /dev/null
+++ b/tools/accuracy_checker/custom_evaluators/__init__.py
@@ -0,0 +1,15 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
diff --git a/tools/accuracy_checker/custom_evaluators/colorization_evaluator.py b/tools/accuracy_checker/custom_evaluators/colorization_evaluator.py
new file mode 100644
index 00000000000..95d3b1b9048
--- /dev/null
+++ b/tools/accuracy_checker/custom_evaluators/colorization_evaluator.py
@@ -0,0 +1,217 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+import numpy as np
+import cv2
+
+from accuracy_checker.evaluators.base_evaluator import BaseEvaluator
+from accuracy_checker.dataset import Dataset
+from accuracy_checker.adapters import create_adapter
+from accuracy_checker.data_readers import BaseReader
+from accuracy_checker.config import ConfigError
+from accuracy_checker.preprocessor import PreprocessingExecutor
+from accuracy_checker.metrics import MetricsExecutor
+from accuracy_checker.launcher import create_launcher
+from accuracy_checker.utils import extract_image_representations, get_path, contains_all
+
+
+class ColorizationEvaluator(BaseEvaluator):
+    """Colorize images with one network and score the result with a verification network."""
+    def __init__(self, dataset, reader, preprocessing, metric_executor, launcher, test_model, check_model):
+        self.dataset = dataset
+        self.preprocessing_executor = preprocessing
+        self.metric_executor = metric_executor
+        self.launcher = launcher
+        self.test_model = test_model
+        self.check_model = check_model
+        self.reader = reader
+        self._metrics_results = []
+
+    @classmethod
+    def from_configs(cls, config):
+        dataset_config = config['datasets'][0]  # only the first dataset entry is used
+        dataset = Dataset(dataset_config)
+        data_reader_config = dataset_config.get('reader', 'opencv_imread')
+        data_source = dataset_config['data_source']
+        if isinstance(data_reader_config, str):
+            reader = BaseReader.provide(data_reader_config, data_source)
+        elif isinstance(data_reader_config, dict):
+            reader = BaseReader.provide(data_reader_config['type'], data_source, data_reader_config)
+        else:
+            raise ConfigError('reader should be dict or string')
+        preprocessing = PreprocessingExecutor(dataset_config.get('preprocessing', []), dataset.name)
+        metrics_executor = MetricsExecutor(dataset_config['metrics'], dataset)
+        launcher_settings = config['launchers'][0]  # only the first launcher entry is used
+        supported_frameworks = ['dlsdk']
+        if launcher_settings['framework'] not in supported_frameworks:
+            raise ConfigError('{} framework not supported'.format(launcher_settings['framework']))
+        launcher = create_launcher(launcher_settings, delayed_model_loading=True)
+        network_info = config.get('network_info', {})
+        if not contains_all(network_info, ['colorization_network', 'verification_network']):
+            raise ConfigError('configuration for colorization_network/verification_network does not exist')
+
+        test_model = ColorizationTestModel(network_info['colorization_network'], launcher)
+        check_model = ColorizationCheckModel(network_info['verification_network'], launcher)
+        return cls(dataset, reader, preprocessing, metrics_executor, launcher, test_model, check_model)
+
+    def process_dataset(self, _, progress_reporter):
+        """Run both networks over every batch and update the metrics; progress_reporter may be None."""
+        self._annotations, self._predictions = ([], []) if self.metric_executor.need_store_predictions else (None, None)
+        if progress_reporter:
+            progress_reporter.reset(self.dataset.size)
+
+        for batch_id, (dataset_indices, batch_annotation) in enumerate(self.dataset):
+            batch_identifiers = [annotation.identifier for annotation in batch_annotation]
+            batch_input = [self.reader(identifier=identifier) for identifier in batch_identifiers]
+            batch_input = self.preprocessing_executor.process(batch_input, batch_annotation)
+            batch_input, _ = extract_image_representations(batch_input)
+            batch_out = self.test_model.predict(batch_annotation, batch_input)
+            batch_prediction = self.check_model.predict(batch_identifiers, batch_out)
+            self.metric_executor.update_metrics_on_batch(dataset_indices, batch_annotation, batch_prediction)
+            if self.metric_executor.need_store_predictions:
+                self._annotations.extend(batch_annotation)
+                self._predictions.extend(batch_prediction)
+            if progress_reporter:
+                progress_reporter.update(batch_id, len(batch_prediction))
+
+        if progress_reporter:
+            progress_reporter.finish()
+
+    def compute_metrics(self, print_results=True, ignore_results_formatting=False):
+        self._metrics_results = []  # always recomputed from scratch
+
+        for result_presenter, evaluated_metric in self.metric_executor.iterate_metrics(
+            self._annotations, self._predictions):
+            self._metrics_results.append(evaluated_metric)
+            if print_results:
+                result_presenter.write_result(evaluated_metric, ignore_results_formatting)
+
+        return self._metrics_results
+
+    def print_metrics_results(self, ignore_results_formatting=False):
+        if not self._metrics_results:
+            self.compute_metrics(True, ignore_results_formatting)
+            return
+        result_presenters = self.metric_executor.get_metric_presenters()
+        for presenter, metric_result in zip(result_presenters, self._metrics_results):
+            presenter.write_result(metric_result, ignore_results_formatting)
+
+    def release(self):
+        self.launcher.release()
+
+    def reset(self):
+        self.metric_executor.reset()
+
+    @staticmethod
+    def get_processing_info(config):
+        """Return (model name, framework, device, tags, dataset name) for the first launcher and dataset."""
+        module_specific_params = config.get('module_config')
+        launcher_config = module_specific_params['launchers'][0]
+        return (
+            config['name'], launcher_config['framework'], launcher_config['device'], launcher_config.get('tags'),
+            module_specific_params['datasets'][0]['name']
+        )
+
+
+class BaseModel:  # helpers shared by the network wrappers below
+    def check_format(self, model_xml, model_bin):
+        """Return both paths as strings; raise ConfigError unless their suffixes are .xml and .bin."""
+        for path, expected_suffix in ((model_xml, '.xml'), (model_bin, '.bin')):
+            if get_path(path).suffix != expected_suffix:
+                raise ConfigError('{} format not supported'.format(path))
+        return str(model_xml), str(model_bin)
+
+    def predict(self, idenitifers, input_data):
+        raise NotImplementedError
+
+    def release(self):
+        pass
+
+
+class ColorizationTestModel(BaseModel):  # wrapper around the colorization network under test
+    def __init__(self, network_info, launcher):
+        super().__init__()
+        xml_path, bin_path = self.check_format(network_info['model'], network_info['weights'])
+        self.network = launcher.create_ie_network(xml_path, bin_path)
+        self.network.batch_size = 1
+        if not hasattr(launcher, 'plugin'):
+            launcher.create_ie_plugin()
+        self.exec_network = launcher.plugin.load(self.network)
+        self.input_blob = next(iter(self.network.inputs))
+        self.output_blob = next(iter(self.network.outputs))
+        self.color_coeff = np.load(network_info['color_coeff'])
+
+    def data_preparation(self, input_data):
+        """Convert the first image to Lab and return two independent copies of its channel 0."""
+        image = input_data[0].astype(np.float32)
+        img_lab = cv2.cvtColor(image, cv2.COLOR_RGB2Lab)
+        lightness = img_lab[:, :, 0]
+        return np.copy(lightness), np.copy(lightness)
+
+    def postprocessing(self, res, img_l, output_blob, img_size):
+        """Turn the raw network output into a one-element list holding a BGR image clipped to [0, 1]."""
+        weighted = res[output_blob] * self.color_coeff.transpose()[:, :, np.newaxis, np.newaxis]
+        predicted = weighted.sum(1).transpose((1, 2, 0)).astype(np.float32)
+        predicted = cv2.resize(predicted, img_size)
+        # channel 0 of the Lab input goes first, the predicted channels follow
+        img_lab_out = np.concatenate((img_l[:, :, np.newaxis], predicted), axis=2)
+        return [np.clip(cv2.cvtColor(img_lab_out, cv2.COLOR_Lab2BGR), 0, 1)]
+
+    def predict(self, identifiers, input_data):
+        """Colorize the first image of input_data; the result is resized back to its original size."""
+        lightness, network_input = self.data_preparation(input_data)
+        output_blob = next(iter(self.exec_network.outputs))
+        height, width = input_data[0].shape[:2]
+        raw_result = self.exec_network.infer(inputs={self.input_blob: [network_input]})
+        # the target size is passed to cv2.resize as (width, height)
+        colorized = self.postprocessing(raw_result, lightness, output_blob, (width, height))
+        return np.array(colorized)
+
+    def release(self):
+        del self.exec_network
+
+    def fit_to_input(self, input_data):
+        """Reshape input_data to the shape of the network input and wrap it in a feed dict."""
+        return {self.input_blob: np.reshape(input_data, self.network.inputs[self.input_blob].shape)}
+
+
+class ColorizationCheckModel(BaseModel):  # wrapper around the verification network
+    def __init__(self, network_info, launcher):
+        super().__init__()
+        model_xml, model_bin = self.check_format(network_info['model'], network_info['weights'])
+        self.adapter = create_adapter(network_info['adapter'])
+        self.network = launcher.create_ie_network(model_xml, model_bin)
+        if hasattr(launcher, 'plugin'):
+            self.exec_network = launcher.plugin.load(self.network)
+        else:
+            launcher.load_network(self.network)
+            self.exec_network = launcher.exec_network
+        self.input_blob = next(iter(self.network.inputs))
+        self.output_blob = next(iter(self.network.outputs))
+        self.adapter.output_blob = self.output_blob
+
+    def predict(self, identifiers, input_data):
+        """Infer on input_data and convert the raw output with the configured adapter."""
+        raw_result = self.exec_network.infer(self.fit_to_input(input_data))
+        return self.adapter.process([raw_result], identifiers, [{}])
+
+    def release(self):
+        del self.exec_network
+
+    def fit_to_input(self, input_data):
+        """Scale by 255 and move axis 3 to position 1, leaving the caller's array untouched."""
+        constant_normalization = 255.
+        scaled = input_data * constant_normalization  # out-of-place on purpose: `*=` altered the argument
+        return {self.input_blob: np.transpose(scaled, (0, 3, 1, 2))}
diff --git a/tools/accuracy_checker/custom_evaluators/mtcnn_evaluator.py b/tools/accuracy_checker/custom_evaluators/mtcnn_evaluator.py
new file mode 100644
index 00000000000..5ab45ff10c2
--- /dev/null
+++ b/tools/accuracy_checker/custom_evaluators/mtcnn_evaluator.py
@@ -0,0 +1,675 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import copy
+from collections import OrderedDict
+import pickle
+from pathlib import Path
+import numpy as np
+import cv2
+
+from accuracy_checker.evaluators import BaseEvaluator
+from accuracy_checker.adapters import create_adapter
+from accuracy_checker.launcher import create_launcher, InputFeeder
+from accuracy_checker.dataset import Dataset
+from accuracy_checker.data_readers import BaseReader, REQUIRES_ANNOTATIONS
+from accuracy_checker.preprocessor import PreprocessingExecutor
+from accuracy_checker.utils import extract_image_representations, read_pickle
+from accuracy_checker.adapters import MTCNNPAdapter
+from accuracy_checker.metrics import MetricsExecutor
+from accuracy_checker.postprocessor import PostprocessingExecutor
+from accuracy_checker.config import ConfigError
+
+
+def build_stages(models_info, preprocessors_config, launcher):
+    """Create the configured MTCNN stages in pnet, rnet, onet order; raises ConfigError on bad config."""
+    def merge_preprocessing(model_specific, common_preprocessing):
+        # a new list is built so the stage configuration is not extended in place
+        if model_specific:
+            return list(model_specific) + list(common_preprocessing)
+        return common_preprocessing
+
+    required_stages = ['pnet']
+    stages_mapping = OrderedDict([
+        ('pnet', {'caffe': CaffeProposalStage, 'dlsdk': DLSDKProposalStage, 'dummy': DummyProposalStage}),
+        ('rnet', {'caffe': CaffeRefineStage, 'dlsdk': DLSDKRefineStage}),
+        ('onet', {'caffe': CaffeOutputStage, 'dlsdk': DLSDKOutputStage})
+    ])
+    framework = launcher.config['framework']
+    stages = []
+    for stage_name, stage_classes in stages_mapping.items():
+        if stage_name not in models_info:
+            if stage_name in required_stages:
+                raise ConfigError('{} required for evaluation'.format(stage_name))
+            continue
+        model_config = models_info[stage_name]
+        # predictions given but not requested to be stored: use the 'dummy' implementation
+        use_dummy = 'predictions' in model_config and not model_config.get('store_predictions', False)
+        stage_framework = 'dummy' if use_dummy else framework
+        stage = stage_classes.get(stage_framework)
+        # test the looked-up class: the mapping itself is never empty
+        if not stage:
+            raise ConfigError('{} stage does not support {} framework'.format(stage_name, stage_framework))
+        stage_preprocess = merge_preprocessing(model_config.get('preprocessing', []), preprocessors_config)
+        preprocessor = PreprocessingExecutor(stage_preprocess)
+        stages.append(stage(model_config, preprocessor, launcher))
+
+    if not stages:
+        raise ConfigError('please provide information about MTCNN pipeline stages')
+    return stages
+
+
+class BaseStage:  # common state and interface of one MTCNN pipeline stage
+    def __init__(self, model_info, preprocessor):
+        self.model_info = model_info
+        self.preprocessor = preprocessor
+        self.input_feeder = None
+        self.store = model_info.get('store_predictions', False)
+        self.predictions = []  # kept for backward compatibility; not read in this class
+        self._predictions = []  # the list that reset() and dump_predictions() actually use
+
+    def predict(self, input_blobs, batch_meta):
+        raise NotImplementedError
+
+    def preprocess_data(self, batch_input, batch_annotation, previous_stage_prediction, *args, **kwargs):
+        raise NotImplementedError
+
+    def postprocess_result(self, identifiers, this_stage_result, batch_meta, previous_stage_result, *args, **kwargs):
+        raise NotImplementedError
+
+    def release(self):
+        pass
+
+    def reset(self):
+        self._predictions = []
+
+    def dump_predictions(self):
+        if not hasattr(self, 'prediction_file'):  # resolved once, then reused
+            self.prediction_file = Path(self.model_info.get('predictions', 'predictions.pickle'))
+        with self.prediction_file.open('wb') as out_file:
+            pickle.dump(self._predictions, out_file)
+
+
+class ProposalBaseStage(BaseStage):
+    """Base of the proposal stage: preprocess the images, infer, optionally adapt and store the result."""
+    def __init__(self, model_info, preprocessor):
+        super().__init__(model_info, preprocessor)
+        self.adapter = None
+        self.input_feeder = None
+        self._predictions = []
+
+    def preprocess_data(self, batch_input, batch_annotation, *args, **kwargs):
+        processed = self.preprocessor.process(batch_input, batch_annotation)
+        batch_meta = extract_image_representations(processed)[1]
+        network_inputs = processed if not self.input_feeder else self.input_feeder.fill_inputs(processed)
+        return network_inputs, batch_meta
+
+    def postprocess_result(self, identifiers, this_stage_result, batch_meta, *args, **kwargs):
+        adapted = this_stage_result if not self.adapter else self.adapter.process(this_stage_result, identifiers, batch_meta)
+        if self.store:
+            self._predictions.extend(adapted)
+        return adapted
+
+    def _infer(self, input_blobs, batch_meta):
+        raise NotImplementedError
+
+    def predict(self, input_blobs, batch_meta):
+        return self._infer(input_blobs, batch_meta)
+
+    def dump_predictions(self):
+        if not hasattr(self, 'prediction_file'):  # resolved once, then reused
+            self.prediction_file = Path(self.model_info.get('predictions', 'pnet_predictions.pickle'))
+        with self.prediction_file.open('wb') as out_file:
+            pickle.dump(self._predictions, out_file)
+
+
+class DummyProposalStage(ProposalBaseStage):  # replays proposal predictions read from a pickle file
+    def __init__(self, model_info, preprocessor, *args, **kwargs):
+        super().__init__(model_info, preprocessor)
+        self._index = 0  # position of the next prediction to hand out
+        if 'predictions' not in self.model_info:
+            raise ConfigError('predictions_file is not found')
+        self._predictions = read_pickle(self.model_info['predictions'])
+        self.iterator = 0
+
+    def preprocess_data(self, batch_input, batch_annotation, *args, **kwargs):
+        return batch_input, extract_image_representations(batch_input)[1]  # no preprocessing, meta only
+
+    def _infer(self, input_blobs, batch_meta):
+        start, self._index = self._index, self._index + len(batch_meta)
+        return self._predictions[start:self._index]
+
+    def postprocess_result(self, identifiers, this_stage_result, batch_meta, *args, **kwargs):
+        return this_stage_result
+
+    def reset(self):
+        self._index = 0  # rewind only: the inherited reset would discard the loaded predictions
+
+
+class RefineBaseStage(BaseStage):
+    """Base of a stage whose inputs are cut from the images using the previous stage predictions."""
+    input_size = 24
+    include_boundaries = True
+
+    def preprocess_data(self, batch_input, batch_annotation, previous_stage_prediction, *args, **kwargs):
+        """Preprocess the images, cut one ROI set per image and fill the network inputs."""
+        processed = self.preprocessor.process(batch_input, batch_annotation)
+        batch_meta = extract_image_representations(processed)[1]
+        rois = [cut_roi(image, prediction, self.input_size, include_bound=self.include_boundaries)
+                for image, prediction in zip(processed, previous_stage_prediction)]
+        network_inputs = rois if not self.input_feeder else self.input_feeder.fill_inputs(rois)
+        return network_inputs, batch_meta
+
+    def postprocess_result(self, identifiers, this_stage_result, batch_meta, previous_stage_result, *args, **kwargs):
+        refined = calibrate_predictions(
+            previous_stage_result, this_stage_result, 0.7, self.model_info['outputs'], 'Union'
+        )
+        if self.store:
+            self._predictions.extend(refined)
+        return refined
+
+    def _infer(self, input_blobs, batch_meta):
+        raise NotImplementedError
+
+    def predict(self, input_blobs, batch_meta):
+        return self._infer(input_blobs, batch_meta)
+
+    def dump_predictions(self):
+        if not hasattr(self, 'prediction_file'):  # resolved once, then reused
+            self.prediction_file = Path(self.model_info.get('predictions', 'rnet_predictions.pickle'))
+        with self.prediction_file.open('wb') as out_file:
+            pickle.dump(self._predictions, out_file)
+
+
+class OutputBaseStage(RefineBaseStage):
+    """Base of the output stage: calibrates the previous predictions, then applies nms to the first one."""
+    input_size = 48
+    include_boundaries = False
+
+    def postprocess_result(self, identifiers, this_stage_result, batch_meta, previous_stage_result, *args, **kwargs):
+        calibrated = calibrate_predictions(previous_stage_result, this_stage_result, 0.7, self.model_info['outputs'])
+        # only the first element of the batch is filtered; the second value returned by nms is unused
+        kept, _ = nms(calibrated[0], 0.7, 'Min')
+        calibrated[0] = kept
+        if self.store:
+            self._predictions.extend(calibrated)
+        return calibrated
+
+    def dump_predictions(self):
+        if not hasattr(self, 'prediction_file'):  # resolved once, then reused
+            self.prediction_file = Path(self.model_info.get('predictions', 'onet_predictions.pickle'))
+        with self.prediction_file.open('wb') as out_file:
+            pickle.dump(self._predictions, out_file)
+
+
+class CaffeModelMixin:
+    """Inference helpers for stages that keep a Caffe network in self.net."""
+    def _infer(self, input_blobs, batch_meta):
+        """Run the network on every feed dict and record the input shapes in each meta entry."""
+        for meta in batch_meta:
+            meta['input_shape'] = []
+        outputs = []
+        for feed_dict in input_blobs:
+            for layer_name, data in feed_dict.items():
+                if data.shape != self.inputs[layer_name]:
+                    self.net.blobs[layer_name].reshape(*data.shape)
+            for meta in batch_meta:
+                meta['input_shape'].append(self.inputs)
+            outputs.append(self.net.forward(**feed_dict))
+        return outputs
+
+    @property
+    def inputs(self):
+        """Mapping from input blob name to the current shape of its data."""
+        return {blob_name: self.net.blobs[blob_name].data.shape for blob_name in self.net.inputs}
+
+    def release(self):
+        del self.net
+
+    def fit_to_input(self, data, layer_name, layout, precision):
+        """Bring data to the layout (and, if given, precision) expected by the named input layer."""
+        data_shape = np.shape(data)
+        layer_shape = self.inputs[layer_name]
+        # 5D data for a 4D layer: only the first element along axis 0 is kept
+        if len(data_shape) == 5 and len(layer_shape) == 4:
+            data = data[0]
+            data_shape = np.shape(data)
+        data = np.array(data) if len(data_shape) != 4 else np.transpose(data, layout)
+        if precision:
+            data = data.astype(precision)
+
+        return data
+
+
+class DLSDKModelMixin:
+    """Inference helpers for stages that keep an Inference Engine network in self.network."""
+    def _infer(self, input_blobs, batch_meta):
+        for meta in batch_meta:
+            meta['input_shape'] = []
+        results = []
+        for feed_dict in input_blobs:
+            input_shapes = {layer_name: data.shape for layer_name, data in feed_dict.items()}
+            self._reshape_input(input_shapes)  # the network is reshaped and reloaded for every feed dict
+            results.append(self.exec_network.infer(feed_dict))
+            for meta in batch_meta:
+                meta['input_shape'].append(self.inputs)
+
+        return results
+
+    def _reshape_input(self, input_shapes):
+        del self.exec_network
+        self.network.reshape(input_shapes)
+        self.exec_network = self.launcher.plugin.load(network=self.network)
+
+    @property
+    def inputs(self):
+        return self.network.inputs
+
+    def release(self):
+        del self.network
+        del self.exec_network
+        self.launcher.release()
+
+    def fit_to_input(self, data, layer_name, layout, precision):
+        layer_shape = tuple(self.inputs[layer_name].shape)
+        data_shape = np.shape(data)
+        if len(layer_shape) == 4:
+            if len(data_shape) == 5:  # 5D data for a 4D layer: keep the first element along axis 0
+                data = data[0]
+            data = np.transpose(data, layout)
+        if precision:
+            data = data.astype(precision)
+
+        return data
+
+    def prepare_model(self, launcher):
+        """Merge launcher settings into self.model_info and return the (model_xml, model_bin) pair."""
+        launcher_specific_entries = [
+            'model', 'weights', 'caffe_model', 'caffe_weights', 'tf_model', 'inputs', 'outputs', '_model_optimizer'
+        ]
+
+        def update_mo_params(launcher_config, model_config):
+            for entry in launcher_specific_entries:
+                if entry in launcher_config and entry not in model_config:
+                    model_config[entry] = launcher_config[entry]
+            model_mo_flags, model_mo_params = model_config.get('mo_flags', []), model_config.get('mo_params', {})
+            launcher_mo_flags, launcher_mo_params = launcher_config.get('mo_flags', []), launcher_config.get(
+                'mo_params', {})
+            for launcher_flag in launcher_mo_flags:
+                if launcher_flag not in model_mo_flags:
+                    model_mo_flags.append(launcher_flag)
+
+            for launcher_mo_key, launcher_mo_value in launcher_mo_params.items():
+                # values already set for the model win; only missing keys are taken from the launcher
+                if launcher_mo_key not in model_mo_params:
+                    model_mo_params[launcher_mo_key] = launcher_mo_value
+
+            model_config['mo_flags'] = model_mo_flags
+            model_config['mo_params'] = model_mo_params
+
+        update_mo_params(launcher.config, self.model_info)
+        if 'caffe_model' in self.model_info:
+            self.model_info.update(launcher.config)  # NOTE(review): overrides model entries - confirm intended
+            model_xml, model_bin = launcher.convert_model(self.model_info)
+        else:
+            model_xml = self.model_info['model']
+            model_bin = self.model_info['weights']
+
+        return model_xml, model_bin
+
+
+class CaffeProposalStage(CaffeModelMixin, ProposalBaseStage):
+    """Proposal stage run through a Caffe network; uses an 'mtcnn_p' adapter unless the launcher sets one."""
+    def __init__(self, model_info, preprocessor, launcher):
+        super().__init__(model_info, preprocessor)
+        self.net = launcher.create_network(self.model_info['model'], self.model_info['weights'])
+        self.input_feeder = InputFeeder(model_info.get('inputs', []), self.inputs, self.fit_to_input)
+        adapter_config = launcher.config.get('adapter', {'type': 'mtcnn_p', **model_info['outputs']})
+        adapter_config['regions_format'] = 'hw'
+        self.adapter = create_adapter(adapter_config)
+
+
+class CaffeRefineStage(CaffeModelMixin, RefineBaseStage):  # refine stage run through a Caffe network
+    def __init__(self,  model_info, preprocessor, launcher):
+        super().__init__(model_info, preprocessor)
+        self.net = launcher.create_network(self.model_info['model'], self.model_info['weights'])
+        self.input_feeder = InputFeeder(model_info.get('inputs', []), self.inputs,  self.fit_to_input)
+
+
+class CaffeOutputStage(CaffeModelMixin, OutputBaseStage):  # output stage run through a Caffe network
+    def __init__(self,  model_info, preprocessor, launcher):
+        super().__init__(model_info, preprocessor)
+        self.net = launcher.create_network(self.model_info['model'], self.model_info['weights'])
+        self.input_feeder = InputFeeder(model_info.get('inputs', []), self.inputs, self.fit_to_input)
+
+
+class DLSDKProposalStage(DLSDKModelMixin, ProposalBaseStage):  # proposal stage run through Inference Engine
+    def __init__(self,  model_info, preprocessor, launcher):
+        super().__init__(model_info, preprocessor)
+        if not hasattr(launcher, 'plugin'):  # the plugin is created once and shared through the launcher
+            launcher.create_ie_plugin(True)
+        model_xml, model_bin = self.prepare_model(launcher)
+        self.network = launcher.create_ie_network(str(model_xml), str(model_bin))
+        self.exec_network = launcher.plugin.load(self.network)
+        self.launcher = launcher
+        self.input_feeder = InputFeeder(model_info.get('inputs', []), self.inputs, self.fit_to_input)
+        pnet_outs = model_info['outputs']
+        pnet_adapter_config = launcher.config.get('adapter', {'type': 'mtcnn_p', **pnet_outs})
+        # NOTE(review): unlike CaffeProposalStage, 'regions_format' is not forced to 'hw' here - confirm
+        self.adapter = create_adapter(pnet_adapter_config)
+
+
+class DLSDKRefineStage(DLSDKModelMixin, RefineBaseStage):  # refine stage run through Inference Engine
+    def __init__(self,  model_info, preprocessor, launcher):
+        super().__init__(model_info, preprocessor)
+
+        if not hasattr(launcher, 'plugin'):  # the plugin is created once and shared through the launcher
+            launcher.create_ie_plugin(True)
+        model_xml, model_bin = self.prepare_model(launcher)
+        self.network = launcher.create_ie_network(str(model_xml), str(model_bin))
+        self.exec_network = launcher.plugin.load(self.network)
+        self.launcher = launcher  # kept because the mixin reloads the network through launcher.plugin
+        self.input_feeder = InputFeeder(model_info.get('inputs', []), self.inputs, self.fit_to_input)
+
+
+class DLSDKOutputStage(DLSDKModelMixin, OutputBaseStage):  # output stage run through Inference Engine
+    def __init__(self,  model_info, preprocessor, launcher):
+        super().__init__(model_info,  preprocessor)
+        if not hasattr(launcher, 'plugin'):  # the plugin is created once and shared through the launcher
+            launcher.create_ie_plugin(True)
+        model_xml, model_bin = self.prepare_model(launcher)
+        self.network = launcher.create_ie_network(str(model_xml), str(model_bin))
+        self.exec_network = launcher.plugin.load(self.network)
+        self.launcher = launcher  # kept because the mixin reloads the network through launcher.plugin
+        self.input_feeder = InputFeeder(model_info.get('inputs', []), self.inputs, self.fit_to_input)
+
+
+class MTCNNEvaluator(BaseEvaluator):
+    def __init__(
+            self, dataset, reader, stages, postprocessing, metrics_executor
+    ):
+        super().__init__()
+        self.dataset = dataset
+        self.reader = reader
+        self.stages = stages
+        self.postprocessing = postprocessing
+        self.metrics_executor = metrics_executor
+        self._metrics_results = []
+        self._annotations, self._predictions = [], []
+
+    def process_dataset(self, stored_predictions, progress_reporter, *args, **kwargs):
+        def no_detections(batch_pred):
+            return batch_pred[0].size == 0
+        if progress_reporter:
+            progress_reporter.reset(self.dataset.size)
+        for batch_id, (_, batch_annotation) in enumerate(self.dataset):
+            batch_identifiers = [annotation.identifier for annotation in batch_annotation]
+            batch_input = [self.reader(identifier=identifier) for identifier in batch_identifiers]
+            batch_predictions = []
+            for stage in self.stages:
+                previous_stage_predictions = batch_predictions
+                filled_inputs, batch_meta = stage.preprocess_data(copy.deepcopy(batch_input), batch_annotation, previous_stage_predictions)
+                batch_predictions = stage.predict(filled_inputs, batch_meta)
+                batch_predictions = stage.postprocess_result(
+                    batch_identifiers, batch_predictions, batch_meta, previous_stage_predictions
+                )
+                if no_detections(batch_predictions):
+                    break
+
+            batch_annotation, batch_predictions = self.postprocessing.process_batch(batch_annotation, batch_predictions)
+
+            self._annotations.extend(batch_annotation)
+            self._predictions.extend(batch_predictions)
+            if progress_reporter:
+                progress_reporter.update(batch_id, len(batch_predictions))
+        for stage in self.stages:
+            if stage.store:
+                stage.dump_predictions()
+
+    def compute_metrics(self, print_results=True, ignore_results_formatting=False):
+        if self._metrics_results:
+            del self._metrics_results
+            self._metrics_results = []
+
+        for result_presenter, evaluated_metric in self.metrics_executor.iterate_metrics(
+                self._annotations, self._predictions):
+            self._metrics_results.append(evaluated_metric)
+            if print_results:
+                result_presenter.write_result(evaluated_metric, ignore_results_formatting)
+
+        return self._metrics_results
+
+    def extract_metrics_results(self, print_results=True, ignore_results_formatting=False):
+        if not self._metrics_results:
+            self.compute_metrics(False, ignore_results_formatting)
+
+        result_presenters = self.metrics_executor.get_metric_presenters()
+        extracted_results, extracted_meta = [], []
+        for presenter, metric_result in zip(result_presenters, self._metrics_results):
+            result, metadata = presenter.extract_result(metric_result)
+            if isinstance(result, list):
+                extracted_results.extend(result)
+                extracted_meta.extend(metadata)
+            else:
+                extracted_results.append(result)
+                extracted_meta.append(metadata)
+            if print_results:
+                presenter.write_result(metric_result, ignore_results_formatting)
+
+        return extracted_results, extracted_meta
+
+    def print_metrics_results(self, ignore_results_formatting=False):
+        if not self._metrics_results:
+            self.compute_metrics(True, ignore_results_formatting)
+            return
+        result_presenters = self.metrics_executor.get_metric_presenters()
+        for presenter, metric_result in zip(result_presenters, self._metrics_results):
+            presenter.write_result(metric_result, ignore_results_formatting)
+
+    @classmethod
+    def from_configs(cls, config):
+        """Build the evaluator from a config holding 'datasets', 'network_info' and 'launchers' entries."""
+        dataset_config = config['datasets'][0]
+        dataset = Dataset(dataset_config)
+        reader_params = dataset_config.get('reader', 'opencv_imread')
+        data_source = dataset_config['data_source']
+
+        if not isinstance(reader_params, (str, dict)):
+            raise ConfigError('reader should be dict or string')
+        # A bare string names the reader type and carries no further reader options.
+        reader_type = reader_params if isinstance(reader_params, str) else reader_params['type']
+        if isinstance(reader_params, str):
+            reader_params = None
+        if reader_type in REQUIRES_ANNOTATIONS:
+            data_source = dataset.annotation  # these reader types receive the annotation as their source
+        data_reader = BaseReader.provide(reader_type, data_source, reader_params)
+
+        models_info = config['network_info']
+        launcher = create_launcher(config['launchers'][0], delayed_model_loading=True)
+        stages = build_stages(models_info, dataset_config.get('preprocessing', []), launcher)
+        metrics_executor = MetricsExecutor(dataset_config['metrics'], dataset)
+        postprocessing = PostprocessingExecutor(dataset_config['postprocessing'])
+
+        return cls(dataset, data_reader, stages, postprocessing, metrics_executor)
+
+    @staticmethod
+    def get_processing_info(config):
+        """Return (model name, framework, device, tags, dataset name) read from an evaluation config."""
+        module_config = config.get('module_config')
+        model_name = config['name']
+        # Only the first dataset and the first launcher of the module config are reported.
+        first_dataset = module_config['datasets'][0]
+        launcher = module_config['launchers'][0]
+        framework, device, tags = launcher['framework'], launcher['device'], launcher.get('tags')
+        return model_name, framework, device, tags, first_dataset['name']
+
+    def release(self):
+        for pipeline_stage in self.stages:  # forward the release call to every stage
+            pipeline_stage.release()
+
+    def reset(self):
+        self.metrics_executor.reset()  # order: metrics executor, then dataset, then each stage
+        self.dataset.reset()
+        for pipeline_stage in self.stages:
+            pipeline_stage.reset()
+
+
+def calibrate_predictions(previous_stage_predictions, out, threshold, outputs_mapping, iou_type=None):
+    """Filter the first previous-stage prediction by score and refine its boxes in place.
+
+    Boxes whose probability output (column 1) is not above 0.7 are removed; when ``iou_type`` is given
+    the survivors also pass through ``nms`` with ``threshold``; the remaining boxes are adjusted by
+    ``bbreg`` using the region output. Returns ``previous_stage_predictions`` itself.
+    """
+    score = out[0][outputs_mapping['probability_out']][:, 1]
+    pass_t = np.where(score > 0.7)[0]
+    prediction = previous_stage_predictions[0]
+    prediction.remove([i for i in range(prediction.size) if i not in pass_t])
+    prediction.scores = score[pass_t]
+    mv = out[0][outputs_mapping['region_out']][pass_t]
+    if iou_type:
+        prediction, peek = nms(prediction, threshold, iou_type)
+        previous_stage_predictions[0] = prediction
+        mv = mv[np.sort(peek).astype(int)]  # regression rows of the boxes nms kept
+
+    # The boxes are stacked once, after the optional nms pass has removed what it rejects.
+    bboxes = np.c_[prediction.x_mins, prediction.y_mins, prediction.x_maxs, prediction.y_maxs, prediction.scores]
+    bboxes = bbreg(bboxes, mv.T)
+    x_mins, y_mins, x_maxs, y_maxs, _ = bboxes.T
+    prediction.x_mins = x_mins
+    prediction.y_mins = y_mins
+    prediction.x_maxs = x_maxs
+    prediction.y_maxs = y_maxs
+
+    return previous_stage_predictions
+
+
+def nms(prediction, threshold, iou_type):
+    """Run ``MTCNNPAdapter.nms`` on the prediction's boxes and drop every box it did not keep.
+
+    Returns the (mutated) prediction together with the indices reported by the adapter.
+    """
+    columns = (prediction.x_mins, prediction.y_mins, prediction.x_maxs, prediction.y_maxs, prediction.scores)
+    peek = MTCNNPAdapter.nms(np.c_[columns], threshold, iou_type)
+    prediction.remove([index for index in range(prediction.size) if index not in peek])
+
+    return prediction, peek
+
+
+def bbreg(boundingbox, reg):
+    """Shift box corners in place by regression offsets scaled with the box width and height.
+
+    The first four columns of ``boundingbox`` are updated; ``reg`` is transposed before use, so it
+    arrives with one row per offset. The mutated ``boundingbox`` is returned.
+    """
+    offsets = reg.T
+    width = boundingbox[:, 2] - boundingbox[:, 0] + 1
+    height = boundingbox[:, 3] - boundingbox[:, 1] + 1
+    # Offsets 0 and 2 are scaled by the width, offsets 1 and 3 by the height.
+    sizes = (width, height, width, height)
+    shifted = [boundingbox[:, col] + offsets[:, col] * sizes[col] for col in range(4)]
+    boundingbox[:, 0:4] = np.array(shifted).T
+
+    return boundingbox
+
+
+def pad(boxesA, h, w):  # builds per-box paste/crop index arrays for limits h and w; works on a copy of boxesA
+    boxes = boxesA.copy()
+
+    tmph = boxes[:, 3] - boxes[:, 1] + 1
+    tmpw = boxes[:, 2] - boxes[:, 0] + 1
+    numbox = boxes.shape[0]
+
+    dx = np.ones(numbox)
+    dy = np.ones(numbox)
+    edx = tmpw  # NOTE: not a copy - writes to edx below also change the tmpw that is returned
+    edy = tmph  # NOTE: not a copy - writes to edy below also change the tmph that is returned
+
+    x = boxes[:, 0:1][:, 0]
+    y = boxes[:, 1:2][:, 0]
+    ex = boxes[:, 2:3][:, 0]
+    ey = boxes[:, 3:4][:, 0]
+
+    tmp = np.where(ex > w)[0]  # boxes whose x end exceeds w
+    if tmp.shape[0] != 0:
+        edx[tmp] = -ex[tmp] + w - 1 + tmpw[tmp]
+        ex[tmp] = w - 1
+
+    tmp = np.where(ey > h)[0]  # boxes whose y end exceeds h
+    if tmp.shape[0] != 0:
+        edy[tmp] = -ey[tmp] + h - 1 + tmph[tmp]
+        ey[tmp] = h - 1
+
+    tmp = np.where(x < 1)[0]  # boxes whose x start is below 1
+    if tmp.shape[0] != 0:
+        dx[tmp] = 2 - x[tmp]
+        x[tmp] = np.ones_like(x[tmp])
+
+    tmp = np.where(y < 1)[0]  # boxes whose y start is below 1
+    if tmp.shape[0] != 0:
+        dy[tmp] = 2 - y[tmp]
+        y[tmp] = np.ones_like(y[tmp])
+
+    # The arithmetic above uses 1-based (MATLAB-style) indices; shift everything to 0-based, clamped at 0.
+    dy = np.maximum(0, dy - 1)
+    dx = np.maximum(0, dx - 1)
+    y = np.maximum(0, y - 1)
+    x = np.maximum(0, x - 1)
+    edy = np.maximum(0, edy - 1)
+    edx = np.maximum(0, edx - 1)
+    ey = np.maximum(0, ey - 1)
+    ex = np.maximum(0, ex - 1)
+    return [dy, edy, dx, edx, y, ey, x, ex, tmpw, tmph]  # tmpw/tmph are returned without the 0-based shift
+
+
+def rerec(bboxA):
+    """Turn each box, in place, into a square of side max(width, height) around the same centre."""
+    width = bboxA[:, 2] - bboxA[:, 0]
+    height = bboxA[:, 3] - bboxA[:, 1]
+    side = np.maximum(width, height)
+    # Move the first corner so the centre stays put, then place the opposite corner one side away.
+    bboxA[:, 0] = bboxA[:, 0] + width * 0.5 - side * 0.5
+    bboxA[:, 1] = bboxA[:, 1] + height * 0.5 - side * 0.5
+    bboxA[:, 2:4] = bboxA[:, 0:2] + side[:, np.newaxis]
+    return bboxA
+
+
+def cut_roi(image, prediction, dst_size, include_bound=True):
+    """Replace ``image.data`` with one ``dst_size`` x ``dst_size`` crop per predicted box.
+
+    Boxes are squared with ``rerec``, truncated with ``np.fix`` and bounded with ``pad``; each crop is
+    pasted into a zero canvas of tmph x tmpw (plus one in each dimension when ``include_bound``) and resized.
+    """
+    columns = (prediction.x_mins, prediction.y_mins, prediction.x_maxs, prediction.y_maxs, prediction.scores)
+    bboxes = np.c_[columns]
+    img = image.data
+    bboxes = rerec(bboxes)
+    bboxes[:, 0:4] = np.fix(bboxes[:, 0:4])
+    dy, edy, dx, edx, y, ey, x, ex, tmpw, tmph = pad(bboxes, *img.shape[:2])
+    extra = int(include_bound)
+    crops = np.zeros((bboxes.shape[0], dst_size, dst_size, 3))
+    for k, crop in enumerate(crops):
+        canvas = np.zeros((int(tmph[k]) + extra, int(tmpw[k]) + extra, 3))
+        canvas_rows = slice(int(dy[k]), int(edy[k]) + 1)
+        canvas_cols = slice(int(dx[k]), int(edx[k]) + 1)
+        image_rows = slice(int(y[k]), int(ey[k]) + 1)
+        image_cols = slice(int(x[k]), int(ex[k]) + 1)
+        canvas[canvas_rows, canvas_cols] = img[image_rows, image_cols]
+        crop[...] = cv2.resize(canvas, (dst_size, dst_size))
+    image.data = crops
+
+    return image
diff --git a/tools/accuracy_checker/custom_evaluators/sequential_action_recognition_evaluator.py b/tools/accuracy_checker/custom_evaluators/sequential_action_recognition_evaluator.py
new file mode 100644
index 00000000000..6e16105cbeb
--- /dev/null
+++ b/tools/accuracy_checker/custom_evaluators/sequential_action_recognition_evaluator.py
@@ -0,0 +1,393 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+from pathlib import Path
+import pickle
+import numpy as np
+from accuracy_checker.evaluators import BaseEvaluator
+from accuracy_checker.dataset import Dataset
+from accuracy_checker.adapters import create_adapter
+from accuracy_checker.data_readers import BaseReader
+from accuracy_checker.config import ConfigError
+from accuracy_checker.preprocessor import PreprocessingExecutor
+from accuracy_checker.metrics import MetricsExecutor
+from accuracy_checker.launcher import create_launcher
+from accuracy_checker.utils import contains_all, extract_image_representations, read_pickle
+
+
+class SequentialActionRecognitionEvaluator(BaseEvaluator):
+    """Evaluator that runs dataset batches through an encoder/decoder ``SequentialModel`` and scores them."""
+    def __init__(self, dataset, reader, preprocessing, metric_executor, launcher, model):
+        self.dataset = dataset
+        self.preprocessing_executor = preprocessing
+        self.metric_executor = metric_executor
+        self.launcher = launcher
+        self.model = model
+        self.reader = reader
+        self._metrics_results = []
+
+    @classmethod
+    def from_configs(cls, config):
+        """Create the evaluator from the first dataset and the first launcher listed in ``config``."""
+        dataset_config = config['datasets'][0]
+        dataset = Dataset(dataset_config)
+        data_reader_config = dataset_config.get('reader', 'opencv_imread')
+        data_source = dataset_config['data_source']
+        if isinstance(data_reader_config, str):
+            reader = BaseReader.provide(data_reader_config, data_source)
+        elif isinstance(data_reader_config, dict):
+            reader = BaseReader.provide(data_reader_config['type'], data_source, data_reader_config)
+        else:
+            raise ConfigError('reader should be dict or string')
+        preprocessing = PreprocessingExecutor(dataset_config.get('preprocessing', []), dataset.name)
+        metrics_executor = MetricsExecutor(dataset_config['metrics'], dataset)
+        launcher = create_launcher(config['launchers'][0], delayed_model_loading=True)
+        model = SequentialModel(config.get('network_info', {}), launcher)
+        return cls(dataset, reader, preprocessing, metrics_executor, launcher, model)
+
+    def process_dataset(self, stored_predictions, progress_reporter, *args, **kwargs):
+        """Run the model over every batch, update the metrics and, if requested, keep the predictions."""
+        store_predictions = self.metric_executor.need_store_predictions
+        # Both branches must be tuples: a bare ``else None, None`` parses as ``(<conditional>), None``.
+        self._annotations, self._predictions = ([], []) if store_predictions else (None, None)
+        if progress_reporter:
+            progress_reporter.reset(self.dataset.size)
+
+        for batch_id, (dataset_indices, batch_annotation) in enumerate(self.dataset):
+            batch_identifiers = [annotation.identifier for annotation in batch_annotation]
+            batch_input = [self.reader(identifier=identifier) for identifier in batch_identifiers]
+            batch_input = self.preprocessing_executor.process(batch_input, batch_annotation)
+            batch_input, _ = extract_image_representations(batch_input)
+            batch_prediction = self.model.predict(batch_identifiers, batch_input)
+            self.metric_executor.update_metrics_on_batch(dataset_indices, batch_annotation, batch_prediction)
+            if store_predictions:
+                self._annotations.extend(batch_annotation)
+                self._predictions.extend(batch_prediction)
+            if progress_reporter:  # the reporter is optional here just like for reset()/finish()
+                progress_reporter.update(batch_id, len(batch_prediction))
+
+        if progress_reporter:
+            progress_reporter.finish()
+        if self.model.store_encoder_predictions:
+            self.model.save_encoder_predictions()
+
+    def compute_metrics(self, print_results=True, ignore_results_formatting=False):
+        """Evaluate all metrics, cache and return their results; optionally print each one."""
+        if self._metrics_results:
+            self._metrics_results = []
+        metrics = self.metric_executor.iterate_metrics(self._annotations, self._predictions)
+        for result_presenter, evaluated_metric in metrics:
+            self._metrics_results.append(evaluated_metric)
+            if print_results:
+                result_presenter.write_result(evaluated_metric, ignore_results_formatting)
+
+        return self._metrics_results
+
+    def extract_metrics_results(self, print_results=True, ignore_results_formatting=False):
+        """Return flat lists of metric values and metadata, computing the metrics first if none are cached."""
+        if not self._metrics_results:
+            self.compute_metrics(False, ignore_results_formatting)
+        result_presenters = self.metric_executor.get_metric_presenters()
+        extracted_results, extracted_meta = [], []
+        for presenter, metric_result in zip(result_presenters, self._metrics_results):
+            result, metadata = presenter.extract_result(metric_result)
+            is_multi = isinstance(result, list)
+            extracted_results.extend(result if is_multi else [result])
+            extracted_meta.extend(metadata if is_multi else [metadata])
+            if print_results:
+                presenter.write_result(metric_result, ignore_results_formatting)
+
+        return extracted_results, extracted_meta
+
+    def print_metrics_results(self, ignore_results_formatting=False):
+        """Print every metric result, evaluating the metrics first when nothing is cached."""
+        if not self._metrics_results:
+            self.compute_metrics(True, ignore_results_formatting)
+            return
+        for presenter, metric_result in zip(self.metric_executor.get_metric_presenters(), self._metrics_results):
+            presenter.write_result(metric_result, ignore_results_formatting)
+
+    def release(self):
+        self.model.release()
+        self.launcher.release()
+
+    def reset(self):
+        self.metric_executor.reset()
+        self.model.reset()
+
+    @staticmethod
+    def get_processing_info(config):
+        """Return (model name, framework, device, tags, dataset name) taken from ``config``."""
+        module_specific_params = config.get('module_config')
+        model_name = config['name']
+        dataset_config = module_specific_params['datasets'][0]
+        launcher_config = module_specific_params['launchers'][0]
+        framework, device = launcher_config['framework'], launcher_config['device']
+        return model_name, framework, device, launcher_config.get('tags'), dataset_config['name']
+
+
+class BaseModel:  # common interface of the per-framework model wrappers in this module
+    def __init__(self, network_info, launcher):
+        self.network_info = network_info  # the launcher argument is accepted but not stored
+
+    def predict(self, idenitifers, input_data):
+        raise NotImplementedError  # concrete models provide their own implementation
+
+    def release(self):
+        """Nothing to free by default; subclasses override this when they hold resources."""
+
+
+def create_encoder(model_config, launcher):
+    """Instantiate the encoder wrapper matching the launcher framework.
+
+    A config that has 'predictions' but no truthy 'store_predictions' gets the ``DummyEncoder`` instead.
+    """
+    framework = launcher.config['framework']
+    replay_stored = 'predictions' in model_config and not model_config.get('store_predictions', False)
+    if replay_stored:
+        framework = 'dummy'
+    encoders = {'dlsdk': EncoderDLSDKModel, 'onnx_runtime': EncoderONNXModel, 'opencv': EncoderOpenCVModel,
+                'dummy': DummyEncoder}
+    if framework not in encoders:
+        raise ValueError('model for framework {} is not supported'.format(framework))
+    return encoders[framework](model_config, launcher)
+
+
+def create_decoder(model_config, launcher):
+    """Instantiate the decoder wrapper registered for the launcher framework."""
+    decoders = {
+        'dlsdk': DecoderDLSDKModel,
+        'onnx_runtime': DecoderONNXModel,
+        'opencv': DecoderOpenCVModel,
+    }
+    framework = launcher.config['framework']
+    if framework not in decoders:
+        raise ValueError('model for framework {} is not supported'.format(framework))
+    return decoders[framework](model_config, launcher)
+
+
+class SequentialModel(BaseModel):
+    """Encodes frames one by one and decodes them in groups of ``num_processing_frames``."""
+    def __init__(self, network_info, launcher):
+        super().__init__(network_info, launcher)
+        if not contains_all(network_info, ['encoder', 'decoder']):
+            raise ConfigError('network_info should contains encoder and decoder fields')
+        encoder_info, decoder_info = network_info['encoder'], network_info['decoder']
+        self.num_processing_frames = decoder_info.get('num_processing_frames', 16)
+        self.processing_frames_buffer = []
+        self.encoder = create_encoder(encoder_info, launcher)
+        self.decoder = create_decoder(decoder_info, launcher)
+        self.store_encoder_predictions = encoder_info.get('store_predictions', False)
+        self._encoder_predictions = [] if self.store_encoder_predictions else None
+
+    def predict(self, idenitifiers, input_data):
+        """Encode each frame; every time the buffer holds enough frames, decode it and start a new one."""
+        frames = input_data[0] if len(np.shape(input_data)) == 5 else input_data
+        predictions = []
+        for frame in frames:
+            encoded = self.encoder.predict(idenitifiers, [frame])
+            self.processing_frames_buffer.append(encoded)
+            if self.store_encoder_predictions:
+                self._encoder_predictions.append(encoded)
+            if len(self.processing_frames_buffer) == self.num_processing_frames:
+                predictions.append(self.decoder.predict(idenitifiers, [self.processing_frames_buffer]))
+                self.processing_frames_buffer = []
+        return predictions
+
+    def reset(self):
+        self.processing_frames_buffer = []
+        self._encoder_predictions = None if self._encoder_predictions is None else []
+
+    def release(self):
+        self.encoder.release()
+        self.decoder.release()
+
+    def save_encoder_predictions(self):
+        if self._encoder_predictions is not None:  # None means encoder outputs were never collected
+            target = Path(self.network_info['encoder'].get('predictions', 'encoder_predictions.pickle'))
+            with target.open('wb') as handle:
+                pickle.dump(self._encoder_predictions, handle)
+
+
+class EncoderDLSDKModel(BaseModel):
+    """Encoder executed through the DLSDK launcher; uses the first input and first output of the network."""
+    def __init__(self, network_info, launcher):
+        super().__init__(network_info, launcher)
+        if 'onnx_model' not in network_info:
+            model_xml, model_bin = str(network_info['model']), str(network_info['weights'])
+        else:
+            network_info.update(launcher.config)  # merge the launcher settings into the model config
+            model_xml, model_bin = launcher.convert_model(network_info)
+        self.network = launcher.create_ie_network(model_xml, model_bin)
+        if not hasattr(launcher, 'plugin'):
+            launcher.create_ie_plugin()
+        self.exec_network = launcher.plugin.load(self.network)
+        self.input_blob = next(iter(self.network.inputs))
+        self.output_blob = next(iter(self.network.outputs))
+
+    def predict(self, identifiers, input_data):
+        return self.exec_network.infer(self.fit_to_input(input_data))[self.output_blob]  # identifiers unused
+
+    def release(self):
+        del self.exec_network
+
+    def fit_to_input(self, input_data):
+        # Move the last axis to position 1, then force the exact shape the network input declares.
+        transposed = np.transpose(input_data, (0, 3, 1, 2))
+        target_shape = self.network.inputs[self.input_blob].shape
+        return {self.input_blob: transposed.reshape(target_shape)}
+
+
+class DecoderDLSDKModel(BaseModel):
+    """Decoder executed through the DLSDK launcher; its output goes through a 'classification' adapter."""
+    def __init__(self, network_info, launcher):
+        super().__init__(network_info, launcher)
+        if 'onnx_model' not in network_info:
+            model_xml, model_bin = str(network_info['model']), str(network_info['weights'])
+        else:
+            network_info.update(launcher.config)  # merge the launcher settings into the model config
+            model_xml, model_bin = launcher.convert_model(network_info)
+
+        self.network = launcher.create_ie_network(model_xml, model_bin)
+        # Load through an existing plugin when there is one, otherwise let the launcher load the network.
+        if hasattr(launcher, 'plugin'):
+            self.exec_network = launcher.plugin.load(self.network)
+        else:
+            launcher.load_network(self.network)
+            self.exec_network = launcher.exec_network
+        self.input_blob = next(iter(self.network.inputs))
+        self.output_blob = next(iter(self.network.outputs))
+        self.adapter = create_adapter('classification')
+        self.adapter.output_blob = self.output_blob
+        self.num_processing_frames = network_info.get('num_processing_frames', 16)
+
+    def predict(self, identifiers, input_data):
+        """Run inference and pass the raw output through the classification adapter."""
+        raw_output = self.exec_network.infer(self.fit_to_input(input_data))
+        return self.adapter.process([raw_output], identifiers, [{}])
+
+    def release(self):
+        del self.exec_network
+
+    def fit_to_input(self, input_data):
+        target_shape = self.network.inputs[self.input_blob].shape
+        return {self.input_blob: np.reshape(input_data, target_shape)}
+
+
+class EncoderONNXModel(BaseModel):
+    """Encoder run through an inference session that the launcher creates from the model path."""
+    def __init__(self, network_info, launcher):
+        super().__init__(network_info, launcher)
+        self.inference_session = launcher.create_inference_session(network_info['model'])
+        self.input_blob = next(iter(self.inference_session.get_inputs()))  # first reported input
+        self.output_blob = next(iter(self.inference_session.get_outputs()))  # first reported output
+
+    def predict(self, identifiers, input_data):
+        return self.inference_session.run((self.output_blob.name, ), self.fit_to_input(input_data))[0]
+
+    def fit_to_input(self, input_data):
+        # Move the last axis to position 1 and reshape to the shape the session input reports.
+        transposed = np.transpose(input_data, (0, 3, 1, 2))
+        return {self.input_blob.name: transposed.reshape(self.input_blob.shape)}
+
+    def release(self):
+        del self.inference_session
+
+
+class DecoderONNXModel(BaseModel):
+    """Decoder run through a launcher-created inference session plus a 'classification' adapter."""
+    def __init__(self, network_info, launcher):
+        super().__init__(network_info, launcher)
+        self.inference_session = launcher.create_inference_session(network_info['model'])
+        self.input_blob = next(iter(self.inference_session.get_inputs()))
+        self.output_blob = next(iter(self.inference_session.get_outputs()))
+        self.adapter = create_adapter('classification')
+        self.adapter.output_blob = self.output_blob.name  # the adapter is given the output's name
+        self.num_processing_frames = network_info.get('num_processing_frames', 16)
+
+    def predict(self, identifiers, input_data):
+        session_outputs = self.inference_session.run((self.output_blob.name,), self.fit_to_input(input_data))
+        return self.adapter.process([{self.output_blob.name: session_outputs[0]}], identifiers, [{}])
+
+    def fit_to_input(self, input_data):
+        return {self.input_blob.name: np.reshape(input_data, self.input_blob.shape)}
+
+    def release(self):
+        del self.inference_session
+
+
+class DummyEncoder(BaseModel):
+    """Encoder stand-in that replays predictions loaded with ``read_pickle``, one per ``predict`` call."""
+    def __init__(self, network_info, launcher):
+        super().__init__(network_info, launcher)
+        if 'predictions' not in network_info:
+            raise ConfigError('predictions_file is not found')
+        self._predictions = read_pickle(network_info['predictions'])  # NOTE(review): load trusted files only
+        self.iterator = 0
+
+    def predict(self, idenitifers, input_data):
+        result, self.iterator = self._predictions[self.iterator], self.iterator + 1
+        return result
+
+
+class EncoderOpenCVModel(BaseModel):
+    """Encoder run through an OpenCV network; input name and shape come from the launcher/model config."""
+    def __init__(self, network_info, launcher):
+        super().__init__(network_info, launcher)
+        self.network = launcher.create_network(network_info['model'], network_info.get('weights', ''))
+        network_info.update(launcher.config)
+        input_shapes = launcher.get_inputs_from_config(network_info)
+        self.input_blob = next(iter(input_shapes))
+        self.input_shape = input_shapes[self.input_blob]
+        self.network.setInputsNames([self.input_blob])  # one whole name; list(name) would split it into chars
+        self.output_blob = next(iter(self.network.getUnconnectedOutLayersNames()))
+
+    def predict(self, identifiers, input_data):
+        self.network.setInput(self.fit_to_input(input_data)[self.input_blob], self.input_blob)
+        return self.network.forward([self.output_blob])[0]
+
+    def fit_to_input(self, input_data):
+        # Move the last axis to position 1, reshape to the configured input shape and cast to float32.
+        input_data = np.transpose(input_data, (0, 3, 1, 2))
+        return {self.input_blob: input_data.reshape(self.input_shape).astype(np.float32)}
+
+    def release(self):
+        del self.network
+
+
+class DecoderOpenCVModel(BaseModel):
+    """Decoder run through an OpenCV network; its output goes through a 'classification' adapter."""
+    def __init__(self, network_info, launcher):
+        super().__init__(network_info, launcher)
+        self.network = launcher.create_network(network_info['model'], network_info.get('weights', ''))
+        input_shapes = launcher.get_inputs_from_config(network_info)
+        self.input_blob = next(iter(input_shapes))
+        self.input_shape = input_shapes[self.input_blob]
+        self.network.setInputsNames([self.input_blob])  # one whole name; list(name) would split it into chars
+        self.output_blob = next(iter(self.network.getUnconnectedOutLayersNames()))
+        self.adapter = create_adapter('classification')
+        self.adapter.output_blob = self.output_blob
+        self.num_processing_frames = network_info.get('num_processing_frames', 16)
+
+    def predict(self, identifiers, input_data):
+        self.network.setInput(self.fit_to_input(input_data)[self.input_blob], self.input_blob)
+        result = self.network.forward([self.output_blob])[0]
+        return self.adapter.process([{self.output_blob: result}], identifiers, [{}])  # output_blob is the name
+
+    def fit_to_input(self, input_data):
+        return {self.input_blob: np.reshape(input_data, self.input_shape).astype(np.float32)}
+
+    def release(self):
+        del self.network
diff --git a/tools/accuracy_checker/custom_evaluators/text_spotting_evaluator.py b/tools/accuracy_checker/custom_evaluators/text_spotting_evaluator.py
new file mode 100644
index 00000000000..2fab2806828
--- /dev/null
+++ b/tools/accuracy_checker/custom_evaluators/text_spotting_evaluator.py
@@ -0,0 +1,292 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+import numpy as np
+
+from accuracy_checker.adapters import create_adapter
+from accuracy_checker.config import ConfigError
+from accuracy_checker.data_readers import BaseReader
+from accuracy_checker.dataset import Dataset
+from accuracy_checker.evaluators import BaseEvaluator
+from accuracy_checker.launcher import create_launcher
+from accuracy_checker.metrics import MetricsExecutor
+from accuracy_checker.preprocessor import PreprocessingExecutor
+from accuracy_checker.utils import contains_all, extract_image_representations
+
+
+class TextSpottingEvaluator(BaseEvaluator):
+    """Evaluator that runs dataset batches through this module's ``SequentialModel`` and scores the output."""
+    def __init__(self, dataset, reader, preprocessing, metric_executor, launcher, model):
+        self.dataset = dataset
+        self.preprocessing_executor = preprocessing
+        self.metric_executor = metric_executor
+        self.launcher = launcher
+        self.model = model
+        self.reader = reader
+        self._metrics_results = []
+
+    @classmethod
+    def from_configs(cls, config):
+        """Create the evaluator from the first dataset and the first launcher listed in ``config``."""
+        dataset_config = config['datasets'][0]
+        dataset = Dataset(dataset_config)
+        data_reader_config = dataset_config.get('reader', 'opencv_imread')
+        data_source = dataset_config['data_source']
+        if isinstance(data_reader_config, str):
+            reader = BaseReader.provide(data_reader_config, data_source)
+        elif isinstance(data_reader_config, dict):
+            reader = BaseReader.provide(data_reader_config['type'], data_source, data_reader_config)
+        else:
+            raise ConfigError('reader should be dict or string')
+        preprocessing = PreprocessingExecutor(dataset_config.get('preprocessing', []), dataset.name)
+        metrics_executor = MetricsExecutor(dataset_config['metrics'], dataset)
+        launcher = create_launcher(config['launchers'][0], delayed_model_loading=True)
+        model = SequentialModel(config.get('network_info', {}), launcher)
+        return cls(dataset, reader, preprocessing, metrics_executor, launcher, model)
+
+    def process_dataset(self, stored_predictions, progress_reporter, *args, **kwargs):
+        """Run the model over every batch, update the metrics and, if requested, keep the predictions."""
+        store_predictions = self.metric_executor.need_store_predictions
+        # Both branches must be tuples: a bare ``else None, None`` parses as ``(<conditional>), None``.
+        self._annotations, self._predictions = ([], []) if store_predictions else (None, None)
+        if progress_reporter:
+            progress_reporter.reset(self.dataset.size)
+
+        for batch_id, (dataset_indices, batch_annotation) in enumerate(self.dataset):
+            batch_identifiers = [annotation.identifier for annotation in batch_annotation]
+            batch_input = [self.reader(identifier=identifier) for identifier in batch_identifiers]
+            batch_input = self.preprocessing_executor.process(batch_input, batch_annotation)
+            batch_input, batch_meta = extract_image_representations(batch_input)
+            batch_prediction = self.model.predict(batch_identifiers, batch_input, batch_meta)
+            self.metric_executor.update_metrics_on_batch(dataset_indices, batch_annotation, batch_prediction)
+            if store_predictions:
+                self._annotations.extend(batch_annotation)
+                self._predictions.extend(batch_prediction)
+            if progress_reporter:  # the reporter is optional here just like for reset()/finish()
+                progress_reporter.update(batch_id, len(batch_prediction))
+
+        if progress_reporter:
+            progress_reporter.finish()
+
+    def compute_metrics(self, print_results=True, ignore_results_formatting=False):
+        """Evaluate all metrics, cache and return their results; optionally print each one."""
+        if self._metrics_results:
+            self._metrics_results = []
+        metrics = self.metric_executor.iterate_metrics(self._annotations, self._predictions)
+        for result_presenter, evaluated_metric in metrics:
+            self._metrics_results.append(evaluated_metric)
+            if print_results:
+                result_presenter.write_result(evaluated_metric, ignore_results_formatting)
+
+        return self._metrics_results
+
+    def extract_metrics_results(self, print_results=True, ignore_results_formatting=False):
+        """Return flat lists of metric values and their metadata, optionally printing each result."""
+        if not self._metrics_results:
+            # Nothing cached yet: evaluate silently, printing (if requested) happens in the loop below.
+            self.compute_metrics(False, ignore_results_formatting)
+
+        result_presenters = self.metric_executor.get_metric_presenters()
+        extracted_results, extracted_meta = [], []
+        for presenter, metric_result in zip(result_presenters, self._metrics_results):
+            result, metadata = presenter.extract_result(metric_result)
+            # extract_result may hand back a list of values; flatten it into the outputs.
+            is_multi = isinstance(result, list)
+            extracted_results.extend(result if is_multi else [result])
+            extracted_meta.extend(metadata if is_multi else [metadata])
+            if print_results:
+                presenter.write_result(metric_result, ignore_results_formatting)
+
+        return extracted_results, extracted_meta
+
+    def print_metrics_results(self, ignore_results_formatting=False):
+        """Print every metric result, evaluating the metrics first when nothing is cached."""
+        if not self._metrics_results:
+            self.compute_metrics(True, ignore_results_formatting)
+            return
+        for presenter, metric_result in zip(self.metric_executor.get_metric_presenters(), self._metrics_results):
+            presenter.write_result(metric_result, ignore_results_formatting)
+
+    def release(self):
+        self.model.release()
+        self.launcher.release()
+
+    def reset(self):
+        self.metric_executor.reset()
+        self.model.reset()
+
+    @staticmethod
+    def get_processing_info(config):
+        """Return (model name, framework, device, tags, dataset name) taken from ``config``."""
+        module_specific_params = config.get('module_config')
+        model_name = config['name']
+        # Only the first dataset and the first launcher of the module config are reported.
+        dataset_config = module_specific_params['datasets'][0]
+        launcher_config = module_specific_params['launchers'][0]
+        framework, device = launcher_config['framework'], launcher_config['device']
+        return model_name, framework, device, launcher_config.get('tags'), dataset_config['name']
+
+
+class BaseModel:  # common interface of the per-framework model wrappers in this module
+    def __init__(self, network_info, launcher):
+        self.network_info = network_info  # the launcher argument is accepted but not stored
+
+    def predict(self, idenitifers, input_data):
+        raise NotImplementedError  # concrete models provide their own implementation
+
+    def release(self):
+        """Nothing to free by default; subclasses override this when they hold resources."""
+
+
+def create_detector(model_config, launcher):
+    """Instantiate the detector wrapper registered for the launcher framework (only 'dlsdk' here)."""
+    detectors = {'dlsdk': DetectorDLSDKModel}
+    framework = launcher.config['framework']
+    if framework not in detectors:
+        # Name the unsupported framework in the error.
+        raise ValueError('model for framework {} is not supported'.format(framework))
+
+    return detectors[framework](model_config, launcher)
+
+
+def create_recognizer(model_config, launcher):
+    """Instantiate the recognizer wrapper registered for the launcher framework (only 'dlsdk' here)."""
+    recognizers = {'dlsdk': RecognizerDLSDKModel}
+    framework = launcher.config['framework']
+    if framework not in recognizers:
+        # Name the unsupported framework in the error.
+        raise ValueError('model for framework {} is not supported'.format(framework))
+
+    return recognizers[framework](model_config, launcher)
+
+
+class SequentialModel(BaseModel):
+    def __init__(self, network_info, launcher):
+        super().__init__(network_info, launcher)
+        if not contains_all(network_info, ['detector', 'recognizer_encoder', 'recognizer_decoder']):
+            raise ConfigError('network_info should contains detector, encoder and decoder fields')
+        self.detector = create_detector(network_info['detector'], launcher)
+        self.recognizer_encoder = create_recognizer(network_info['recognizer_encoder'], launcher)
+        self.recognizer_decoder = create_recognizer(network_info['recognizer_decoder'], launcher)
+        self.recognizer_decoder_inputs = network_info['recognizer_decoder_inputs']
+        self.recognizer_decoder_outputs = network_info['recognizer_decoder_outputs']
+        self.max_seq_len = int(network_info['max_seq_len'])
+        self.adapter = create_adapter(network_info['adapter'])
+        self.alphabet = network_info['alphabet']
+        self.sos_index = int(network_info['sos_index'])
+        self.eos_index = int(network_info['eos_index'])
+
+    def predict(self, idenitifiers, input_data, frame_meta):
+        assert len(idenitifiers) == 1
+
+        detector_outputs = self.detector.predict(idenitifiers, input_data)
+        text_features = detector_outputs['text_features']
+
+        texts = []
+        for feature in text_features:
+            feature = self.recognizer_encoder.predict(idenitifiers, {'input': feature})['output']
+            feature = np.reshape(feature, (feature.shape[0], feature.shape[1], -1))
+            feature = np.transpose(feature, (0, 2, 1))
+
+            hidden_shape = self.recognizer_decoder.network.inputs[
+                self.recognizer_decoder_inputs['prev_hidden']].shape
+            hidden = np.zeros(hidden_shape)
+            prev_symbol_index = np.ones((1,)) * self.sos_index
+
+            text = str()
+
+            for i in range(self.max_seq_len):
+                input_to_decoder = {
+                    self.recognizer_decoder_inputs['prev_symbol']: prev_symbol_index,
+                    self.recognizer_decoder_inputs['prev_hidden']: hidden,
+                    self.recognizer_decoder_inputs['encoder_outputs']: feature}
+                decoder_outputs = self.recognizer_decoder.predict(idenitifiers, input_to_decoder)
+                coder_output = decoder_outputs[
+                    self.recognizer_decoder_outputs['symbols_distribution']]
+                prev_symbol_index = np.argmax(coder_output, axis=1)
+                if prev_symbol_index == self.eos_index:
+                    break
+                hidden = decoder_outputs[self.recognizer_decoder_outputs['cur_hidden']]
+                text += self.alphabet[int(prev_symbol_index)]
+            texts.append(text)
+
+        texts = np.array(texts)
+
+        detector_outputs['texts'] = texts
+        output = self.adapter.process(detector_outputs, idenitifiers, frame_meta)
+        return output
+
+    def reset(self):
+        pass
+
+    def release(self):
+        self.detector.release()
+        self.recognizer_encoder.release()
+        self.recognizer_decoder.release()
+
+
+class DetectorDLSDKModel(BaseModel):
+    def __init__(self, network_info, launcher):
+        super().__init__(network_info, launcher)
+        model_xml = str(network_info['model'])
+        model_bin = str(network_info['weights'])
+        self.network = launcher.create_ie_network(model_xml, model_bin)
+        if not hasattr(launcher, 'plugin'):
+            launcher.create_ie_plugin()
+        self.exec_network = launcher.plugin.load(self.network)
+        self.im_info_name = [x for x in self.network.inputs if len(self.network.inputs[x].shape) == 2][0]
+        self.im_data_name = [x for x in self.network.inputs if len(self.network.inputs[x].shape) == 4][0]
+
+    def predict(self, identifiers, input_data):
+        input_data = np.array(input_data)
+        assert len(input_data.shape) == 4
+        assert input_data.shape[0] == 1
+
+        input_data = {self.im_data_name: self.fit_to_input(input_data),
+                      self.im_info_name: np.array(
+                          [[input_data.shape[1], input_data.shape[2], 1.0]])}
+
+        output = self.exec_network.infer(input_data)
+
+        return output
+
+    def release(self):
+        del self.exec_network
+
+    def fit_to_input(self, input_data):
+        input_data = np.transpose(input_data, (0, 3, 1, 2))
+        input_data = input_data.reshape(self.network.inputs[self.im_data_name].shape)
+
+        return input_data
+
+
+class RecognizerDLSDKModel(BaseModel):
+    def __init__(self, network_info, launcher):
+        super().__init__(network_info, launcher)
+        model_xml = str(network_info['model'])
+        model_bin = str(network_info['weights'])
+
+        self.network = launcher.create_ie_network(model_xml, model_bin)
+        if hasattr(launcher, 'plugin'):
+            self.exec_network = launcher.plugin.load(self.network)
+        else:
+            launcher.load_network(self.network)
+            self.exec_network = launcher.exec_network
+
+    def predict(self, identifiers, input_data):
+        return self.exec_network.infer(input_data)
+
+    def release(self):
+        del self.exec_network
diff --git a/tools/accuracy_checker/data/test_models/pytorch_model/__init__.py b/tools/accuracy_checker/data/test_models/pytorch_model/__init__.py
new file mode 100644
index 00000000000..7c9fcf6dc14
--- /dev/null
+++ b/tools/accuracy_checker/data/test_models/pytorch_model/__init__.py
@@ -0,0 +1,15 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
diff --git a/tools/accuracy_checker/data/test_models/pytorch_model/samplenet.pth b/tools/accuracy_checker/data/test_models/pytorch_model/samplenet.pth
new file mode 100644
index 00000000000..6c70368e095
Binary files /dev/null and b/tools/accuracy_checker/data/test_models/pytorch_model/samplenet.pth differ
diff --git a/tools/accuracy_checker/data/test_models/pytorch_model/samplenet.py b/tools/accuracy_checker/data/test_models/pytorch_model/samplenet.py
new file mode 100644
index 00000000000..a742a650c02
--- /dev/null
+++ b/tools/accuracy_checker/data/test_models/pytorch_model/samplenet.py
@@ -0,0 +1,38 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import torch.nn as nn
+import torch.nn.functional as F
+
+
+class SampLeNet(nn.Module):
+    def __init__(self):
+        super(SampLeNet, self).__init__()
+        self.conv1 = nn.Conv2d(3, 6, 5)
+        self.pool = nn.MaxPool2d(2, 2)
+        self.conv2 = nn.Conv2d(6, 16, 5)
+        self.fc1 = nn.Linear(16 * 5 * 5, 120)
+        self.fc2 = nn.Linear(120, 84)
+        self.fc3 = nn.Linear(84, 10)
+
+    def forward(self, x):
+        x = self.pool(F.relu(self.conv1(x)))
+        x = self.pool(F.relu(self.conv2(x)))
+        x = x.view(-1, 16 * 5 * 5)
+        x = F.relu(self.fc1(x))
+        x = F.relu(self.fc2(x))
+        x = self.fc3(x)
+        return x
diff --git a/tools/accuracy_checker/dataset_definitions.yml b/tools/accuracy_checker/dataset_definitions.yml
index 650e0f92b58..7f97a0a754d 100644
--- a/tools/accuracy_checker/dataset_definitions.yml
+++ b/tools/accuracy_checker/dataset_definitions.yml
@@ -1,7 +1,3 @@
-launchers:
-  - framework: dlsdk
-    cpu_extensions: AUTO
-
 datasets:
   - name: ms_coco_mask_rcnn
     annotation_conversion:
@@ -33,6 +29,21 @@ datasets:
     annotation: mscoco_mask_rcnn_short_91.pickle
     dataset_meta: mscoco_mask_rcnn_short_91.json
     data_source: val2017
+    preprocessing:
+      - type: resize
+        aspect_ratio_scale: fit_to_window
+        dst_height: 800
+        dst_width: 1365
+      - type: padding
+        dst_height: 800
+        dst_width: 1365
+        pad_type: right_bottom
+
+    postprocessing:
+      - type: faster_rcnn_postprocessing_resize
+        dst_height: 800
+        dst_width: 1365
+
 
   - name: ms_coco_detection_91_classes
     annotation_conversion:
@@ -44,6 +55,31 @@ datasets:
     annotation: mscoco_det_91.pickle
     dataset_meta: mscoco_det_91.json
     data_source: val2017
+    preprocessing:
+      - type: resize
+        aspect_ratio_scale: fit_to_window
+        dst_height: 600
+        dst_width: 1024
+      - type: padding
+        dst_height: 600
+        dst_width: 1024
+        pad_type: right_bottom
+
+    postprocessing:
+      - type: faster_rcnn_postprocessing_resize
+        dst_height: 600
+        dst_width: 1024
+
+  - name: ms_coco_detection_80_class_without_backgound
+    data_source: val2017
+    annotation_conversion:
+      converter: mscoco_detection
+      annotation_file: instances_val2017.json
+      has_background: False
+      sort_annotations: True
+      use_full_label_map: False
+    annotation:  mscoco_det_80.pickle
+    dataset_meta:  mscoco_det_80.json
 
   - name: ms_coco_keypoints
     data_source: val2017
@@ -64,12 +100,12 @@ datasets:
     annotation: imagenet1000.pickle
     data_source: ILSVRC2012_img_val
     metrics:
-    - name: accuracy@top1
-      type: accuracy
-      top_k: 1
-    - name: acciracy@top5
-      type: accuracy
-      top_k: 5
+      - name: accuracy@top1
+        type: accuracy
+        top_k: 1
+      - name: accuracy@top5
+        type: accuracy
+        top_k: 5
 
   - name: imagenet_1000_classes_2015
     annotation_conversion:
@@ -78,12 +114,12 @@ datasets:
     annotation: imagenet1000_2015.pickle
     data_source: ILSVRC2012_img_val
     metrics:
-    - name: accuracy@top1
-      type: accuracy
-      top_k: 1
-    - name: acciracy@top5
-      type: accuracy
-      top_k: 5
+      - name: accuracy@top1
+        type: accuracy
+        top_k: 1
+      - name: accuracy@top5
+        type: accuracy
+        top_k: 5
 
   - name: imagenet_1001_classes
     annotation_conversion:
@@ -93,12 +129,12 @@ datasets:
     annotation: imagenet1001.pickle
     data_source: ILSVRC2012_img_val
     metrics:
-    - name: accuracy@top1
-      type: accuracy
-      top_k: 1
-    - name: acciracy@top5
-      type: accuracy
-      top_k: 5
+      - name: accuracy@top1
+        type: accuracy
+        top_k: 1
+      - name: accuracy@top5
+        type: accuracy
+        top_k: 5
 
   - name: VOC2012
     annotation_conversion:
@@ -110,12 +146,29 @@ datasets:
     annotation: voc12.pickle
     dataset_meta: voc12.json
     postprocessing:
-    - type: resize_prediction_boxes
+      - type: resize_prediction_boxes
     metrics:
-    - type: map
-      integral: 11point
-      ignore_difficult: True
-      presenter: print_scalar
+      - type: map
+        integral: 11point
+        ignore_difficult: True
+        presenter: print_scalar
+
+  - name: VOC2012_without_background
+    annotation_conversion:
+      converter: voc_detection
+      annotations_dir: VOCdevkit/VOC2012/Annotations
+      images_dir: VOCdevkit/VOC2012/JPEGImages
+      imageset_file: VOCdevkit/VOC2012/ImageSets/Main/val.txt
+    data_source: VOCdevkit/VOC2012/JPEGImages
+    annotation: voc12_without_background.pickle
+    dataset_meta: voc12_without_background.json
+    postprocessing:
+      - type: resize_prediction_boxes
+    metrics:
+      - type: map
+        integral: 11point
+        ignore_difficult: True
+        presenter: print_scalar
 
   - name: VOC2012_Segmentation
     annotation_conversion:
@@ -244,6 +297,17 @@ datasets:
     annotation: mscoco_person_detection.pickle
     dataset_meta: mscoco_person_detection.json
 
+  - name: mscoco_person_detection
+    data_source: val2017
+    annotation_conversion:
+      converter: mscoco_detection
+      annotation_file: person_keypoints_val2017.json
+      has_background: True
+      sort_annotations: True
+      use_full_label_map: True
+    annotation: mscoco_person_detection.pickle
+    dataset_meta: mscoco_person_detection.json
+
   - name: crossroad_dataset_1016
     data_source: val2017
     annotation_conversion:
@@ -303,9 +367,15 @@ datasets:
     annotation: lpr.pickle
     dataset_meta: lpr.json
 
+    preprocessing:
+      - type: resize
+        dst_width: 94
+        dst_height: 24
+
+
   - name: image_retrieval
     data_source: textile_crops
-    annotattion_conversion:
+    annotation_conversion:
       converter: image_retrieval
       data_dir: textile_crops
       gallery_annotation_file: textile_crops/gallery/gallery.txt
@@ -315,3 +385,278 @@ datasets:
     preprocessing:
       - type: resize
         size: 224
+
+  - name: lfw
+    data_source: LFW/lfw
+    annotation_conversion:
+      converter: lfw
+      pairs_file: LFW/annotation/pairs.txt
+      landmarks_file: LFW/annotation/lfw_landmark.txt
+    annotation: lfw.pickle
+
+    metrics:
+      - type: pairwise_accuracy_subsets
+        subset_number: 2
+
+  - name: ICDAR2015
+    data_source: ICDAR15_DET/ch4_test_images
+    annotation_conversion:
+      converter: icdar_detection
+      data_dir: ICDAR15_DET/gt
+    annotation: icdar15_detection.pickle
+
+  - name: ICDAR2015_word_spotting
+    data_source: ICDAR15_DET/ch4_test_images
+    annotation_conversion:
+      converter: icdar_detection
+      word_spotting: True
+      data_dir: ICDAR15_DET/gt
+    annotation: icdar15_detection.pickle
+
+  - name: ICDAR2013
+    data_source: ICDAR13_REC/Challenge2_Test_Task3_Images
+    annotation_conversion:
+      converter: icdar13_recognition
+      annotation_file: ICDAR13_REC/gt/gt.txt.fixed.alfanumeric
+    annotation: icdar13_recognition.pickle
+    dataset_meta: icdar13_recognition.json
+
+  - name: market1501
+    data_source: Market-1501-v15.09.15
+    annotation_conversion:
+      converter: market1501_reid
+      data_dir: Market-1501-v15.09.15
+    annotation: market1501_reid.pickle
+
+  - name: globalme-reid
+    data_source: GlobalMe-reID
+    annotation_conversion:
+      converter: market1501_reid
+      data_dir: globalme-reid/GlobalMe-reID
+    annotation: globalme-reid.pickle
+
+  - name: vgg2face
+    data_source: VGGFaces2/test
+    annotation_conversion:
+      converter: vgg_face
+      landmarks_csv_file: VGGFaces2/bb_landmark/loose_landmark_test.csv
+      bbox_csv_file: VGGFaces2/bb_landmark/loose_bb_test.csv
+    annotation: vggfaces2.pickle
+    dataset_meta: vggfaces2.json
+
+  - name: semantic_segmentation_adas
+    data_source: segmentation
+    annotation_conversion:
+      converter: common_semantic_segmentation
+      images_dir: segmentation/images
+      masks_dir: segmentation/mask_segmentation_adas
+      image_postfix: .JPEG
+      mask_postfix: .png
+      dataset_meta: segmentation/mask_segmentation_adas/dataset_meta.json
+    annotation: semantic_segmentation_adas.pickle
+    dataset_meta: semantic_segmentation_adas.json
+
+    preprocessing:
+      - type: resize
+        dst_height: 1024
+        dst_width: 2048
+
+    postprocessing:
+      - type: encode_segmentation_mask
+        apply_to: annotation
+      - type: resize_segmentation_mask
+        apply_to: annotation
+        dst_height: 1024
+        dst_width: 2048
+
+  - name: road_segmentation
+    data_source: segmentation
+    annotation_conversion:
+      converter: common_semantic_segmentation
+      images_dir: segmentation/images
+      masks_dir: segmentation/mask_road_segmentation
+      image_postfix: .JPEG
+      mask_postfix: .png
+      dataset_meta: segmentation/mask_road_segmentation/dataset_meta.json
+    annotation: road_segmentation.pickle
+    dataset_meta: road_segmentation.json
+
+    preprocessing:
+      - type: resize
+        dst_height: 512
+        dst_width: 896
+
+    postprocessing:
+      - type: encode_segmentation_mask
+        apply_to: annotation
+      - type: resize_segmentation_mask
+        apply_to: annotation
+        dst_height: 512
+        dst_width: 896
+
+    metrics:
+      - type: mean_iou
+        presenter: print_vector
+      - type: mean_accuracy
+        presenter: print_vector
+
+  - name: super_resolution_x3
+    data_source: super_resolution
+    annotation_conversion:
+      converter: super_resolution
+      data_dir: super_resolution
+      lr_suffix: lr_x3
+      upsample_suffix: upsample_x3
+      hr_suffix: hr
+      two_streams: True
+    annotation: super_resolution_x3.pickle
+
+    metrics:
+      - type: psnr
+        scale_border: 4
+        presenter: print_vector
+
+  - name: super_resolution_x4
+    data_source: super_resolution
+    annotation_conversion:
+      converter: super_resolution
+      data_dir: super_resolution
+      lr_suffix: lr_x4
+      upsample_suffix: upsample_x4
+      hr_suffix: hr
+      two_streams: True
+    annotation: super_resolution_x4.pickle
+
+    metrics:
+      - type: psnr
+        scale_border: 4
+        presenter: print_vector
+
+  - name: text_super_resolution_x3
+    data_source: super_resolution
+    annotation_conversion:
+      converter: super_resolution
+      data_dir: super_resolution
+      lr_suffix: lr_x3
+      hr_suffix: hr_gray
+    annotation: text_super_resolution_x3.pickle
+
+    preprocessing:
+      - type: bgr_to_gray
+
+    metrics:
+      - type: psnr
+        scale_border: 4
+        presenter: print_vector
+
+  - name: head_pose
+    data_source: WIDER_val/images/16--Award_Ceremony
+    annotation: head_pose.pickle
+
+    preprocessing:
+      - type: crop_rect
+      - type: resize
+        size: 60
+
+  - name: gaze_estimation_dataset
+    data_source: gaze_estimation
+    annotation: gaze_estimation.pickle
+
+    reader:
+      type: combine_reader
+      scheme:
+        ".*.png": opencv_imread
+        ".*.json":
+          type: json_reader
+          key: head_pose_angles
+
+  - name: handwritten_score_recognition
+    data_source: ILSVRC2012_img_val
+    annotation: handwritten_score_recognition.pickle
+    dataset_meta: handwritten_score_recognition.json
+
+  - name: cmu_panoptic_keypoints
+    data_source: cmu_panoptic_subset
+    annotation_conversion:
+      converter: cmu_panoptic_keypoints
+      data_dir: cmu_panoptic_subset
+    annotation: cmu_panoptic_keypoints.pickle
+
+  - name: kinetics-400
+    data_source: kinetics/frames_val
+    annotation_conversion:
+      converter: clip_action_recognition
+      annotation_file: kinetics/kinetics_400.json
+      data_dir: kinetics/frames_val
+    annotation: kinetics_action_recognition.pickle
+    dataset_meta: kinetics_action_recognition.json
+
+  - name: driver_action_recognition_dataset
+    data_source: kinetics/frames_val
+    annotation_conversion:
+      converter: clip_action_recognition
+      annotation_file: kinetics/driver_action_recognition.json
+      data_dir: kinetics/frames_val
+    annotation: driver_action_recognition.pickle
+    dataset_meta: driver_action_recognition.json
+
+  - name: BraTS
+    data_source: BraTS
+    reader: numpy_reader
+    annotation_conversion:
+      converter: brats_numpy
+      data_dir: BraTS
+      ids_file: BraTS/val_ids.p
+      labels_file: BraTS/labels
+    annotation: brats.pickle
+    dataset_meta: brats.json
+
+  - name: BraTS_2017
+    data_source: BraTS_2017
+    reader:
+      type: nifti_reader
+      channels_first: True
+    annotation_conversion:
+      converter: brats
+      data_dir: BraTS_2017
+      labels_file: BraTS_2017/labels
+      mask_channels_first: True
+    annotation: brats2017.pickle
+    dataset_meta: brats2017.json
+
+  - name: product_detection
+    annotation: product_detection.pickle
+    dataset_meta: product_detection.json
+    data_source: product_detection
+
+    metrics:
+      - type: coco_precision
+
+  - name: ms_coco_single_keypoints
+    data_source: val2017
+    annotation_conversion:
+      converter: mscoco_single_keypoints
+      annotation_file: person_keypoints_val2017.json
+    annotation: mscoco_single_keypoints.pickle
+    dataset_meta: mscoco_single_keypoints.json
+    metrics:
+      - name: AP
+        type: coco_orig_keypoints_precision
+
+  - name: CamVid
+    data_source: CamVid
+    annotation_conversion:
+      converter: camvid
+      annotation_file: CamVid/val.txt
+    annotation: camvid.pickle
+    dataset_meta: camvid.json
+
+  - name: msasl-100
+    data_source: msasl/global_crops
+    annotation_conversion:
+      converter: continuous_clip_action_recognition
+      annotation_file: msasl/msasl_100.txt
+      data_dir: msasl/global_crops
+      out_fps: 15
+      clip_length: 16
+    annotation: msasl/msasl_action_recognition.pickle
diff --git a/tools/accuracy_checker/pytest.ini b/tools/accuracy_checker/pytest.ini
new file mode 100644
index 00000000000..fe55d2ed64b
--- /dev/null
+++ b/tools/accuracy_checker/pytest.ini
@@ -0,0 +1,2 @@
+[pytest]
+junit_family=xunit2
diff --git a/tools/accuracy_checker/requirements-test.in b/tools/accuracy_checker/requirements-test.in
new file mode 100644
index 00000000000..62075023174
--- /dev/null
+++ b/tools/accuracy_checker/requirements-test.in
@@ -0,0 +1,2 @@
+pytest~=5.0
+pytest-mock~=2.0
diff --git a/tools/accuracy_checker/requirements.in b/tools/accuracy_checker/requirements.in
new file mode 100644
index 00000000000..ed2bc2f588e
--- /dev/null
+++ b/tools/accuracy_checker/requirements.in
@@ -0,0 +1,28 @@
+# core components
+numpy>=1.11,<1.18
+PyYAML
+
+# progress bar
+tqdm
+
+# image reading and preprocessing
+pillow>=2.6.1
+
+# reid
+scikit-learn
+
+# pipelining mode
+yamlloader
+
+# cpu extension usage
+py-cpuinfo<=4.0
+
+# text detection
+shapely
+
+# brain tumor segmentation
+nibabel
+scipy
+
+# nlp, tokenization
+sentencepiece
diff --git a/tools/accuracy_checker/sample/README.md b/tools/accuracy_checker/sample/README.md
index cbf8cfd6e6e..a7cbc3186a4 100644
--- a/tools/accuracy_checker/sample/README.md
+++ b/tools/accuracy_checker/sample/README.md
@@ -37,4 +37,4 @@ Used options: `-c` path to evaluation config, `-m` directory where models are st
 
 If everything worked correctly, you should be able to get `75.02%` accuracy.
 
-Now try edit config, to run SampLeNet on other device or framework (e.g. Caffe, MxNet or OpenCV), or go directly to your topology!
+Now try editing the config to run SampLeNet on another device or framework (e.g. Caffe, MXNet or OpenCV), or go directly to your topology!
diff --git a/tools/accuracy_checker/sample/opencv_sample_config.yml b/tools/accuracy_checker/sample/opencv_sample_config.yml
index 7eca2150de2..c263a3a3190 100644
--- a/tools/accuracy_checker/sample/opencv_sample_config.yml
+++ b/tools/accuracy_checker/sample/opencv_sample_config.yml
@@ -47,7 +47,7 @@ models:
           #  In order to do this you need to provide your own annotation converter,
           # i.e. implement BaseFormatConverter interface.
           # All annotation converters are stored in accuracy_checker/annotation_converters directory.
-          converter: cifar10
+          converter: cifar
           # converter specific parameters.
           # Full range available options you can find in accuracy_checker/annotation_converters/README.md
           # relative paths will be merged with "-s/--source" option
@@ -57,6 +57,8 @@ models:
           convert_images: True
           # path to save converted images.
           converted_images_dir: sample_dataset/test
+          # number of classes in the dataset, used for label_map generation
+          num_classes: 10
 
         # list of preprocessing, applied to each image during validation
         # order of entries matters
diff --git a/tools/accuracy_checker/sample/sample_config.yml b/tools/accuracy_checker/sample/sample_config.yml
index 6d9652a870d..f3fe5bafe85 100644
--- a/tools/accuracy_checker/sample/sample_config.yml
+++ b/tools/accuracy_checker/sample/sample_config.yml
@@ -38,7 +38,7 @@ models:
           #  In order to do this you need to provide your own annotation converter,
           # i.e. implement BaseFormatConverter interface.
           # All annotation converters are stored in accuracy_checker/annotation_converters directory.
-          converter: cifar10
+          converter: cifar
           # converter specific parameters.
           # Full range available options you can find in accuracy_checker/annotation_converters/README.md
           # relative paths will be merged with "-s/--source" option
@@ -48,6 +48,8 @@ models:
           convert_images: True
           # path to save converted images.
           converted_images_dir: sample_dataset/test
+          # number of classes in the dataset, used for label_map generation
+          num_classes: 10
 
         # list of preprocessing, applied to each image during validation
         # order of entries matters
diff --git a/tools/accuracy_checker/setup.cfg b/tools/accuracy_checker/setup.cfg
index 7c49a45db3c..ad131b321c4 100644
--- a/tools/accuracy_checker/setup.cfg
+++ b/tools/accuracy_checker/setup.cfg
@@ -5,4 +5,4 @@ ignore = F401
 [isort]
 line_length = 120
 use_parentheses = True
-known_third_party = openvino.inference_engine,caffe,cv2,mxnet,tensorflow
+known_third_party = openvino.inference_engine,caffe,cv2,mxnet,tensorflow,torch
diff --git a/tools/accuracy_checker/setup.py b/tools/accuracy_checker/setup.py
index 417f189206c..45ccbf96c3b 100644
--- a/tools/accuracy_checker/setup.py
+++ b/tools/accuracy_checker/setup.py
@@ -17,31 +17,10 @@
 import importlib
 import re
 import sys
-from collections import OrderedDict
 from setuptools import find_packages, setup
 from setuptools.command.test import test as test_command
 from pathlib import Path
 
-requirements = OrderedDict([
-    ('NumPy', 'numpy'),
-    ('tqdm', 'tqdm'),
-    ('PyYAML', 'PyYAML'),
-    ('ymlloader', 'yamlloader'),
-    ('Pillow', 'pillow'),
-    ('scikit-learn', 'scikit-learn'),
-    ('scipy', 'scipy<1.2'),
-    ('cpuinfo', 'py-cpuinfo<=4.0'),
-    ('shapely', 'shapely'),
-    ('nibabel', 'nibabel')
-])
-
-try:
-    importlib.import_module('cv2')
-except ImportError:
-    requirements['opencv'] = 'opencv-python'
-
-tests_requirements = OrderedDict([("PyTest", 'pytest==4.0.0'), ("PyTest Mock", 'pytest-mock==1.10.4')])
-
 
 class PyTest(test_command):
     user_options = [('pytest-args=', 'a', "Arguments to pass to pytest")]
@@ -77,6 +56,13 @@ def find_version(*path):
 long_description = read("README.md")
 version = find_version("accuracy_checker", "__init__.py")
 
+requirements = [read("requirements.in")]
+
+try:
+    importlib.import_module('cv2')
+except ImportError:
+    requirements.append('opencv-python')
+
 setup(
     name="accuracy_checker",
     description="Deep Learning Accuracy validation framework",
@@ -90,7 +76,7 @@ def find_version(*path):
     ]},
     zip_safe=False,
     python_requires='>=3.5',
-    install_requires=list(requirements.values()),
-    tests_require=list(tests_requirements.values()),
+    install_requires=requirements,
+    tests_require=[read("requirements-test.in")],
     cmdclass={'test': PyTest}
 )
diff --git a/tools/accuracy_checker/tests/common.py b/tools/accuracy_checker/tests/common.py
index 063a6cd7399..7195bdd2cc3 100644
--- a/tools/accuracy_checker/tests/common.py
+++ b/tools/accuracy_checker/tests/common.py
@@ -57,10 +57,10 @@ def make_representation(bounding_boxes, is_ground_truth=False, score=None, meta=
 
     result = []
     for idx, box in enumerate(bounding_boxes):
-        arr = np.array(np.mat(box))
-
         if box == "":
             arr = np.array([]).reshape((0, 5))
+        else:
+            arr = np.array([np.fromstring(row, sep=' ') for row in box.split(';')])
 
         if is_ground_truth or score:
             assert arr.shape[1] == 5
diff --git a/tools/accuracy_checker/tests/test_adapters.py b/tools/accuracy_checker/tests/test_adapters.py
index 3e363132e8a..f834bc0228b 100644
--- a/tools/accuracy_checker/tests/test_adapters.py
+++ b/tools/accuracy_checker/tests/test_adapters.py
@@ -26,7 +26,7 @@ def test_detection_adapter():
     raw = {
         'detection_out': np.array([[[[0, 3, 0.2, 0, 0, 1, 1], [0, 2, 0.5, 4, 4, 7, 7], [0, 5, 0.7, 3, 3, 9, 8]]]])
     }
-    expected = make_representation('0.2,3,0,0,1,1;0.5,2,4,4,7,7;0.7,5,3,3,9,8')
+    expected = make_representation('0.2 3 0 0 1 1;0.5 2 4 4 7 7;0.7 5 3 3 9 8')
 
     actual = SSDAdapter({}, output_blob='detection_out').process([raw], ['0'], [{}])
 
@@ -39,7 +39,7 @@ def test_detection_adapter_partially_filling_output_blob():
             [[[[0, 3, 0.2, 0, 0, 1, 1], [0, 2, 0.5, 4, 4, 7, 7], [0, 5, 0.7, 3, 3, 9, 8], [-1, 0, 0, 0, 0, 0, 0]]]]
         )
     }
-    expected = make_representation('0.2,3,0,0,1,1;0.5,2,4,4,7,7;0.7,5,3,3,9,8')
+    expected = make_representation('0.2 3 0 0 1 1;0.5 2 4 4 7 7;0.7 5 3 3 9 8')
 
     actual = SSDAdapter({}, output_blob='detection_out').process([raw], ['0'])
 
@@ -56,7 +56,7 @@ def test_detection_adapter_partially_filling_output_blob_with_zeros_at_the_end()
             [0,  0, 0,   0, 0, 0, 0]
         ]]])
     }
-    expected = make_representation('0.2,3,0,0,1,1;0.5,2,4,4,7,7;0.7,5,3,3,9,8')
+    expected = make_representation('0.2 3 0 0 1 1;0.5 2 4 4 7 7;0.7 5 3 3 9 8')
 
     actual = SSDAdapter({}, output_blob='detection_out').process([raw], ['0'])
 
@@ -67,7 +67,7 @@ def test_detection_adapter_batch_2():
     raw = {
         'detection_out': np.array([[[[0, 3, 0.2, 0, 0, 1, 1], [0, 2, 0.5, 4, 4, 7, 7], [1, 5, 0.7, 3, 3, 9, 8]]]])
     }
-    expected = make_representation(['0.2,3,0,0,1,1;0.5,2,4,4,7,7', '0.7,5,3,3,9,8'])
+    expected = make_representation(['0.2 3 0 0 1 1;0.5 2 4 4 7 7', '0.7 5 3 3 9 8'])
 
     actual = SSDAdapter({}, output_blob='detection_out').process([raw], ['0', '1'])
 
diff --git a/tools/accuracy_checker/tests/test_caffe_launcher.py b/tools/accuracy_checker/tests/test_caffe_launcher.py
index a68b40bb71d..f4fb99db86d 100644
--- a/tools/accuracy_checker/tests/test_caffe_launcher.py
+++ b/tools/accuracy_checker/tests/test_caffe_launcher.py
@@ -71,4 +71,3 @@ def test_missed_weights_in_create_caffe_launcher_raises_config_error_exception()
 
     with pytest.raises(ConfigError):
         create_launcher(launcher)
-
diff --git a/tools/accuracy_checker/tests/test_config_reader.py b/tools/accuracy_checker/tests/test_config_reader.py
index 5bbc72cd8c8..7286836c42f 100644
--- a/tools/accuracy_checker/tests/test_config_reader.py
+++ b/tools/accuracy_checker/tests/test_config_reader.py
@@ -88,7 +88,7 @@ def setup_method(self):
             'bitstreams': Path('bitstreams/'),
             'definitions': None,
             'stored_predictions': None,
-            'tf_custom_op_config': None,
+            'tf_custom_op_config_dir': None,
             'tf_obj_detection_api_pipeline_config_path': None,
             'progress': 'bar',
             'target_framework': None,
@@ -96,22 +96,24 @@ def setup_method(self):
             'log_file': None,
             'target_tags': None,
             'cpu_extensions_mode': None,
-            'aocl': None
+            'aocl': None,
+            'deprecated_ir_v7': False,
+            'transformations_config_dir': None
         })
 
     def test_read_configs_without_global_config(self, mocker):
         config = {'models': [{
             'name': 'model',
-            'launchers': [{'framework': 'dlsdk', 'model': Path('/absolute_path'), 'weights': Path('/absolute_path')}],
+            'launchers': [{'framework': 'dlsdk', 'model': Path('/absolute_path').absolute(), 'weights': Path('/absolute_path').absolute(), '_models_prefix': Path.cwd()}],
             'datasets': [{'name': 'global_dataset'}]
         }]}
         empty_args = Namespace(**{
-            'models': None, 'extensions': None, 'source': None, 'annotations': None,
-            'converted_models': None, 'model_optimizer': None, 'bitstreams': None,
-            'definitions': None, 'config': None, 'stored_predictions': None, 'tf_custom_op_config': None,
+            'models': Path.cwd(), 'extensions': Path.cwd(), 'source': Path.cwd(), 'annotations': Path.cwd(),
+            'converted_models': None, 'model_optimizer': None, 'bitstreams': Path.cwd(),
+            'definitions': None, 'config': None, 'stored_predictions': None, 'tf_custom_op_config_dir': None,
             'progress': 'bar', 'target_framework': None, 'target_devices': None, 'log_file': None,
             'tf_obj_detection_api_pipeline_config_path': None, 'target_tags': None, 'cpu_extensions_mode': None,
-            'aocl': None
+            'aocl': None, 'deprecated_ir_v7': False, 'transformations_config_dir': None
         })
         mocker.patch('accuracy_checker.utils.get_path', return_value=Path.cwd())
         mocker.patch('yaml.load', return_value=config)
@@ -130,7 +132,7 @@ def test_empty_local_config_raises_value_error_exception(self, mocker):
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Missing local config'
 
     def test_missed_models_in_local_config_raises_value_error_exception(self, mocker):
@@ -141,8 +143,8 @@ def test_missed_models_in_local_config_raises_value_error_exception(self, mocker
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
-        assert error_message == 'Missed "{}" in local config'.format('models')
+        error_message = str(exception.value).split(sep=': ')[-1]
+        assert error_message == 'Accuracy Checker not_models mode is not supported. Please select between evaluations, models, pipelines'
 
     def test_empty_models_in_local_config_raises_value_error_exception(self, mocker):
         mocker.patch(self.module + '._read_configs', return_value=(
@@ -152,7 +154,7 @@ def test_empty_models_in_local_config_raises_value_error_exception(self, mocker)
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Missed "{}" in local config'.format('models')
 
     def test_missed_name_in_model_raises_value_error_exception(self, mocker):
@@ -163,7 +165,7 @@ def test_missed_name_in_model_raises_value_error_exception(self, mocker):
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Each model must specify {}'.format(', '.join(['name', 'launchers', 'datasets']))
 
     def test_missed_launchers_in_model_raises_value_error_exception(self, mocker):
@@ -174,7 +176,7 @@ def test_missed_launchers_in_model_raises_value_error_exception(self, mocker):
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Each model must specify {}'.format(', '.join(['name', 'launchers', 'datasets']))
 
     def test_missed_datasets_in_model_raises_value_error_exception(self, mocker):
@@ -185,7 +187,7 @@ def test_missed_datasets_in_model_raises_value_error_exception(self, mocker):
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Each model must specify {}'.format(', '.join(['name', 'launchers', 'datasets']))
 
     def test_invalid_model_raises_value_error_exception(self, mocker):
@@ -196,7 +198,7 @@ def test_invalid_model_raises_value_error_exception(self, mocker):
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Each model must specify {}'.format(', '.join(['name', 'launchers', 'datasets']))
 
     def test_empty_pipeline_in_local_config_raises_value_error_exception(self, mocker):
@@ -207,7 +209,7 @@ def test_empty_pipeline_in_local_config_raises_value_error_exception(self, mocke
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Missed "{}" in local config'.format('pipelines')
 
     def test_missed_name_in_pipeline_raises_value_error_exception(self, mocker):
@@ -218,7 +220,7 @@ def test_missed_name_in_pipeline_raises_value_error_exception(self, mocker):
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Each pipeline must specify {}'.format(', '.join(['name', 'stages']))
 
     def test_missed_stages_in_pipeline_raises_value_error_exception(self, mocker):
@@ -229,7 +231,7 @@ def test_missed_stages_in_pipeline_raises_value_error_exception(self, mocker):
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Each pipeline must specify {}'.format(', '.join(['name', 'stages']))
 
     def test_invalid_pipeline_raises_value_error_exception(self, mocker):
@@ -240,7 +242,7 @@ def test_invalid_pipeline_raises_value_error_exception(self, mocker):
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Each pipeline must specify {}'.format(', '.join(['name', 'stages']))
 
     def test_pipeline_empty_stages_raises_value_error_exception(self, mocker):
@@ -251,7 +253,7 @@ def test_pipeline_empty_stages_raises_value_error_exception(self, mocker):
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Each pipeline must specify {}'.format(', '.join(['name', 'stages']))
 
     def test_pipeline_first_stage_does_not_contain_dataset_raises_value_error_exception(self, mocker):
@@ -264,7 +266,7 @@ def test_pipeline_first_stage_does_not_contain_dataset_raises_value_error_except
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'First stage should contain dataset'
 
     def test_pipeline_contains_several_datasets_raises_value_error_exception(self, mocker):
@@ -291,7 +293,7 @@ def test_pipeline_contains_several_datasets_raises_value_error_exception(self, m
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Exactly one dataset per pipeline is supported'
 
     def test_pipeline_without_launchers_raises_value_error_exception(self, mocker):
@@ -311,7 +313,7 @@ def test_pipeline_without_launchers_raises_value_error_exception(self, mocker):
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Launchers are not specified'
 
     def test_pipeline_without_metrics_raises_value_error_exception(self, mocker):
@@ -330,13 +332,13 @@ def test_pipeline_without_metrics_raises_value_error_exception(self, mocker):
         with pytest.raises(ConfigError) as exception:
             ConfigReader.merge(self.arguments)
 
-        error_message = str(exception).split(sep=': ')[-1]
+        error_message = str(exception.value).split(sep=': ')[-1]
         assert error_message == 'Metrics are not specified'
 
     def test_merge_datasets_with_definitions(self, mocker):
         local_config = {'models': [{
             'name': 'model',
-            'launchers': [{'framework': 'dlsdk', 'model': '/absolute_path', 'weights': '/absolute_path'}],
+            'launchers': [{'framework': 'dlsdk', 'model': Path('/absolute_path').absolute(), 'weights': Path('/absolute_path').absolute()}],
             'datasets': [{'name': 'global_dataset'}]
         }]}
         mocker.patch(self.module + '._read_configs', return_value=(
@@ -354,7 +356,7 @@ def test_merge_datasets_with_definitions(self, mocker):
     def test_merge_datasets_with_definitions_and_meta_is_not_modified(self, mocker):
         local_config = {'models': [{
             'name': 'model',
-            'launchers': [{'framework': 'dlsdk', 'model': '/absolute_path', 'weights': '/absolute_path'}],
+            'launchers': [{'framework': 'dlsdk', 'model': Path('/absolute_path').absolute(), 'weights': Path('/absolute_path').absolute()}],
             'datasets': [{'name': 'global_dataset', 'dataset_meta': '/absolute_path'}]
         }]}
         expected = self.global_datasets[0]
@@ -403,21 +405,91 @@ def test_expand_relative_paths_in_datasets_config_using_command_line(self, mocke
 
             assert config['models'][0]['datasets'][0] == expected
 
+    def test_expand_relative_paths_in_datasets_config_using_env_variable(self, mocker):  # NOTE(review): name says "using_env_variable", but the expected paths below are built from the command-line prefixes — confirm naming
+        local_config = {'models': [{
+            'name': 'model',
+            'launchers': [{'framework': 'caffe'}],
+            'datasets': [{
+                'name': 'global_dataset',
+                'dataset_meta': 'relative_annotation_path',
+                'data_source': 'relative_source_path',
+                'segmentation_masks_source': 'relative_source_path',
+                'annotation': 'relative_annotation_path'
+            }]
+        }]}
+
+        mocker.patch(self.module + '._read_configs', return_value=(  # stub config reading: None in the first slot, local_config in the second
+            None, local_config
+        ))
+        expected = copy.deepcopy(local_config['models'][0]['datasets'][0])  # deep copy so the expectations do not alias the config handed to merge()
+        with mock_filesystem(['source_2/']) as env_prefix:  # NOTE(review): this context closes before merge() runs; only the mocker patch outlives it — confirm intended
+            mocker.patch('os.environ.get', return_value=str(env_prefix))  # every os.environ.get(...) call now returns this path string
+        with mock_filesystem(['source/', 'annotations/']) as prefix:
+            expected['annotation'] = prefix / self.arguments.annotations / 'relative_annotation_path'  # annotation-type entries are expected under the annotations prefix
+            expected['dataset_meta'] = prefix / self.arguments.annotations / 'relative_annotation_path'
+            expected['segmentation_masks_source'] = prefix / self.arguments.source / 'relative_source_path'  # source-type entries are expected under the source prefix
+            expected['data_source'] = prefix / self.arguments.source / 'relative_source_path'
+
+            arguments = copy.deepcopy(self.arguments)  # work on a copy so the shared fixture arguments stay untouched
+            arguments.bitstreams = None
+            arguments.extensions = None
+            arguments.source = prefix / arguments.source  # command-line prefixes are re-rooted inside the mocked filesystem
+            arguments.annotations = prefix / self.arguments.annotations
+
+            config = ConfigReader.merge(arguments)[0]  # only element 0 of merge()'s result is inspected
+
+            assert config['models'][0]['datasets'][0] == expected
+
+    def test_not_overwrite_relative_paths_in_datasets_config_using_env_variable_if_commandline_provided(self, mocker):
+        """With os.environ.get mocked and no source/annotations arguments, relative dataset paths are expected under the mocked prefix."""
+        local_config = {'models': [{
+            'name': 'model',
+            'launchers': [{'framework': 'caffe'}],
+            'datasets': [{
+                'name': 'global_dataset',
+                'dataset_meta': 'relative_annotation_path',
+                'data_source': 'relative_source_path',
+                'segmentation_masks_source': 'relative_source_path',
+                'annotation': 'relative_annotation_path'
+            }]
+        }]}
+
+        mocker.patch(self.module + '._read_configs', return_value=(  # stub config reading: None in the first slot, local_config in the second
+            None, local_config
+        ))
+        expected = copy.deepcopy(local_config['models'][0]['datasets'][0])  # deep copy so the expectations do not alias the config handed to merge()
+        with mock_filesystem(['source/']) as prefix:
+            mocker.patch('os.environ.get', return_value=str(prefix))  # every os.environ.get(...) call now returns this path string
+            expected['dataset_meta'] = prefix / 'relative_annotation_path'
+            expected['segmentation_masks_source'] = prefix / 'relative_source_path'
+            expected['data_source'] = prefix / 'relative_source_path'
+            expected['annotation'] = prefix / 'relative_annotation_path'
+
+            arguments = copy.deepcopy(self.arguments)  # work on a copy so the shared fixture arguments stay untouched
+            arguments.bitstreams = None
+            arguments.extensions = None
+            arguments.source = None  # NOTE(review): no command-line prefixes are supplied although the test name says "if_commandline_provided" — confirm naming
+            arguments.annotations = None
+
+            config = ConfigReader.merge(arguments)[0]  # only element 0 of merge()'s result is inspected
+
+            assert config['models'][0]['datasets'][0] == expected
+
     def test_not_modify_absolute_paths_in_datasets_config_using_command_line(self):
         local_config = {'models': [{
             'name': 'model',
             'datasets': [{
                 'name': 'global_dataset',
-                'dataset_meta': '/absolute_annotation_meta_path',
-                'data_source': '/absolute_source_path',
-                'annotation': '/absolute_annotation_path',
+                'dataset_meta': Path('/absolute_annotation_meta_path').absolute(),
+                'data_source': Path('/absolute_source_path').absolute(),
+                'annotation': Path('/absolute_annotation_path').absolute(),
             }]
         }]}
 
         expected = copy.deepcopy(local_config['models'][0]['datasets'][0])
-        expected['annotation'] = Path('/absolute_annotation_path')
-        expected['dataset_meta'] = Path('/absolute_annotation_meta_path')
-        expected['data_source'] = Path('/absolute_source_path')
+        expected['annotation'] = Path('/absolute_annotation_path').absolute()
+        expected['dataset_meta'] = Path('/absolute_annotation_meta_path').absolute()
+        expected['data_source'] = Path('/absolute_source_path').absolute()
 
         ConfigReader._merge_paths_with_prefixes(self.arguments, local_config)
 
@@ -431,7 +503,7 @@ def test_expand_relative_paths_in_pipeline_stage_dataset_config_using_command_li
                 'segmentation_masks_source': 'relative_source_path',
                 'annotation': 'relative_annotation_path'
             }
-        launcher_config = {'framework': 'dlsdk', 'model': '/absolute_path', 'weights': '/absolute_path'}
+        launcher_config = {'framework': 'dlsdk', 'model': Path('/absolute_path').absolute(), 'weights': '/absolute_path'}
         pipelines_config = [
             {
                 'name': 'pipeline', 'device_info': [{'framework': 'caffe', 'device': 'CPU'}],
@@ -499,11 +571,11 @@ def test_not_modify_absolute_paths_in_pipeline_stage_dataset_config_using_comman
     def test_merge_launcher_with_device_info(self, mocker):
         dataset_config = {
             'name': 'global_dataset',
-            'dataset_meta': '/absolute_annotation_meta_path',
-            'data_source': '/absolute_source_path',
-            'annotation': '/absolute_annotation_path'
+            'dataset_meta': Path('/absolute_annotation_meta_path').absolute(),
+            'data_source': Path('/absolute_source_path').absolute(),
+            'annotation': Path('/absolute_annotation_path').absolute()
         }
-        launcher_config = {'framework': 'caffe', 'model': Path('/absolute_path'), 'weights': Path('/absolute_path')}
+        launcher_config = {'framework': 'caffe', 'model': Path('/absolute_path').absolute(), 'weights': Path('/absolute_path').absolute()}
         device_info = {'device': 'CPU'}
         expected = copy.deepcopy(launcher_config)
         expected.update(device_info)
@@ -528,11 +600,11 @@ def test_merge_launcher_with_device_info(self, mocker):
     def test_merge_launcher_with_target_deivce_in_pipeline(self, mocker):
         dataset_config = {
             'name': 'global_dataset',
-            'dataset_meta': '/absolute_annotation_meta_path',
-            'data_source': '/absolute_source_path',
-            'annotation': '/absolute_annotation_path'
+            'dataset_meta': Path('/absolute_annotation_meta_path').absolute(),
+            'data_source': Path('/absolute_source_path').absolute(),
+            'annotation': Path('/absolute_annotation_path').absolute()
         }
-        launcher_config = {'framework': 'caffe', 'model': Path('/absolute_path'), 'weights': Path('/absolute_path')}
+        launcher_config = {'framework': 'caffe', 'model': Path('/absolute_path').absolute(), 'weights': Path('/absolute_path').absolute()}
         device_info = {'device': 'CPU'}
         expected = copy.deepcopy(launcher_config)
         expected.update(device_info)
@@ -559,11 +631,11 @@ def test_merge_launcher_with_target_deivce_in_pipeline(self, mocker):
     def test_merge_launcher_with_2_device_info(self, mocker):
         dataset_config = {
             'name': 'global_dataset',
-            'dataset_meta': '/absolute_annotation_meta_path',
-            'data_source': '/absolute_source_path',
-            'annotation': '/absolute_annotation_path'
+            'dataset_meta': Path('/absolute_annotation_meta_path').absolute(),
+            'data_source': Path('/absolute_source_path').absolute(),
+            'annotation': Path('/absolute_annotation_path').absolute()
         }
-        launcher_config = {'framework': 'caffe', 'model': Path('/absolute_path'), 'weights': Path('/absolute_path')}
+        launcher_config = {'framework': 'caffe', 'model': Path('/absolute_path').absolute(), 'weights': Path('/absolute_path').absolute()}
         device_info = [{'device': 'CPU'}, {'device': 'GPU'}]
         expected = [copy.deepcopy(launcher_config), copy.deepcopy(launcher_config)]
         expected[0].update(device_info[0])
@@ -590,11 +662,11 @@ def test_merge_launcher_with_2_device_info(self, mocker):
     def test_merge_launcher_with_2_target_devices(self, mocker):
         dataset_config = {
             'name': 'global_dataset',
-            'dataset_meta': '/absolute_annotation_meta_path',
-            'data_source': '/absolute_source_path',
-            'annotation': '/absolute_annotation_path'
+            'dataset_meta': Path('/absolute_annotation_meta_path').absolute(),
+            'data_source': Path('/absolute_source_path').absolute(),
+            'annotation': Path('/absolute_annotation_path').absolute()
         }
-        launcher_config = {'framework': 'caffe', 'model': Path('/absolute_path'), 'weights': Path('/absolute_path')}
+        launcher_config = {'framework': 'caffe', 'model': Path('/absolute_path').absolute(), 'weights': Path('/absolute_path').absolute()}
         device_info = [{'device': 'CPU'}, {'device': 'GPU'}]
         expected = [copy.deepcopy(launcher_config), copy.deepcopy(launcher_config)]
         expected[0].update(device_info[0])
@@ -647,11 +719,11 @@ def test_merge_launchers_with_definitions(self, mocker):
     def test_merge_launchers_with_model_is_not_modified(self, mocker):
         local_config = {'models': [{
             'name': 'model',
-            'launchers': [{'framework': 'dlsdk', 'model': 'custom'}],
+            'launchers': [{'framework': 'dlsdk', 'model': Path('/custom').absolute()}],
             'datasets': [{'name': 'global_dataset'}]
         }]}
         expected = copy.deepcopy(self.get_global_launcher('dlsdk'))
-        expected['model'] = 'custom'
+        expected['model'] = Path('/custom').absolute()
         mocker.patch(self.module + '._read_configs', return_value=(
             self.global_config, local_config
         ))
@@ -714,15 +786,15 @@ def test_both_launchers_are_filtered_by_target_tags_if_tags_not_provided_in_conf
         config_launchers = [
             {
                 'framework': 'dlsdk',
-                'model': '/absolute_path1',
-                'weights': '/absolute_path1',
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
             },
             {
                 'framework': 'dlsdk',
-                'model': '/absolute_path2',
-                'weights': '/absolute_path2',
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU',
             }
@@ -743,8 +815,8 @@ def test_launcher_is_not_filtered_by_the_same_tag(self, mocker):
         config_launchers = [{
             'framework': 'dlsdk',
             'tags': ['some_tag'],
-            'model': Path('/absolute_path1'),
-            'weights': Path('/absolute_path1'),
+            'model': Path('/absolute_path1').absolute(),
+            'weights': Path('/absolute_path1').absolute(),
             'adapter': 'classification',
             'device': 'CPU',
             '_model_optimizer': self.arguments.model_optimizer,
@@ -755,6 +827,8 @@ def test_launcher_is_not_filtered_by_the_same_tag(self, mocker):
         args = copy.deepcopy(self.arguments)
         args.model_optimizer = None
         args.converted_models = None
+        args.extensions = None
+        args.bitstreams = None
         args.target_tags = ['some_tag']
 
         config = ConfigReader.merge(args)[0]
@@ -767,8 +841,8 @@ def test_both_launchers_are_not_filtered_by_the_same_tag(self, mocker):
             {
                 'framework': 'dlsdk',
                 'tags': ['some_tag'],
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -777,8 +851,8 @@ def test_both_launchers_are_not_filtered_by_the_same_tag(self, mocker):
             {
                 'framework': 'dlsdk',
                 'tags': ['some_tag'],
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -790,11 +864,16 @@ def test_both_launchers_are_not_filtered_by_the_same_tag(self, mocker):
         args = copy.deepcopy(self.arguments)
         args.model_optimizer = None
         args.converted_models = None
+        args.extensions = None
+        args.bitstreams = None
         args.target_tags = ['some_tag']
 
         config = ConfigReader.merge(args)[0]
 
-        launchers = config['models'][0]['launchers']
+        assert len(config['models']) == 2
+        assert len(config['models'][0]['launchers']) == 1
+        assert len(config['models'][1]['launchers']) == 1
+        launchers = [config['models'][0]['launchers'][0], config['models'][1]['launchers'][0]]
         assert launchers == config_launchers
 
     def test_both_launchers_are_filtered_by_another_tag(self, mocker):
@@ -802,8 +881,8 @@ def test_both_launchers_are_filtered_by_another_tag(self, mocker):
             {
                 'framework': 'dlsdk',
                 'tags': ['some_tag'],
-                'model': '/absolute_path1',
-                'weights': '/absolute_path1',
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -812,8 +891,8 @@ def test_both_launchers_are_filtered_by_another_tag(self, mocker):
             {
                 'framework': 'dlsdk',
                 'tags': ['some_tag'],
-                'model': '/absolute_path2',
-                'weights': '/absolute_path2',
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -837,8 +916,8 @@ def test_only_appropriate_launcher_is_filtered_by_another_tag(self, mocker):
             {
                 'framework': 'dlsdk',
                 'tags': ['tag1'],
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -847,8 +926,8 @@ def test_only_appropriate_launcher_is_filtered_by_another_tag(self, mocker):
             {
                 'framework': 'caffe',
                 'tags': ['tag2'],
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -875,8 +954,8 @@ def test_only_appropriate_launcher_is_filtered_by_another_tag_if_provided_severa
             {
                 'framework': 'dlsdk',
                 'tags': ['tag1'],
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -885,8 +964,8 @@ def test_only_appropriate_launcher_is_filtered_by_another_tag_if_provided_severa
             {
                 'framework': 'caffe',
                 'tags': ['tag2'],
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -913,8 +992,8 @@ def test_launcher_with_several_tags_contained_at_least_one_from_target_tegs_is_n
             {
                 'framework': 'dlsdk',
                 'tags': ['tag1', 'tag2'],
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -926,6 +1005,8 @@ def test_launcher_with_several_tags_contained_at_least_one_from_target_tegs_is_n
         args = copy.deepcopy(self.arguments)
         args.model_optimizer = None
         args.converted_models = None
+        args.extensions = None
+        args.bitstreams = None
         args.target_tags = ['tag2']
 
         config = ConfigReader.merge(args)[0]
@@ -939,8 +1020,8 @@ def test_both_launchers_with_different_tags_are_not_filtered_by_the_same_tags(se
             {
                 'framework': 'dlsdk',
                 'tags': ['tag1'],
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -949,8 +1030,8 @@ def test_both_launchers_with_different_tags_are_not_filtered_by_the_same_tags(se
             {
                 'framework': 'dlsdk',
                 'tags': ['tag2'],
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -962,18 +1043,23 @@ def test_both_launchers_with_different_tags_are_not_filtered_by_the_same_tags(se
         args = copy.deepcopy(self.arguments)
         args.model_optimizer = None
         args.converted_models = None
+        args.extensions = None
+        args.bitstreams = None
         args.target_tags = ['tag1', 'tag2']
 
         config = ConfigReader.merge(args)[0]
 
-        launchers = config['models'][0]['launchers']
+        assert len(config['models']) == 2
+        assert len(config['models'][0]['launchers']) == 1
+        assert len(config['models'][1]['launchers']) == 1
+        launchers = [config['models'][0]['launchers'][0], config['models'][1]['launchers'][0]]
         assert launchers == config_launchers
 
     def test_launcher_is_not_filtered_by_the_same_framework(self, mocker):
         config_launchers = [{
             'framework': 'dlsdk',
-            'model': Path('/absolute_path1'),
-            'weights': Path('/absolute_path1'),
+            'model': Path('/absolute_path1').absolute(),
+            'weights': Path('/absolute_path1').absolute(),
             'adapter': 'classification',
             'device': 'CPU',
             '_model_optimizer': self.arguments.model_optimizer,
@@ -984,6 +1070,8 @@ def test_launcher_is_not_filtered_by_the_same_framework(self, mocker):
         args = copy.deepcopy(self.arguments)
         args.model_optimizer = None
         args.converted_models = None
+        args.extensions = None
+        args.bitstreams = None
         args.target_framework = 'dlsdk'
 
         config = ConfigReader.merge(args)[0]
@@ -995,8 +1083,8 @@ def test_both_launchers_are_not_filtered_by_the_same_framework(self, mocker):
         config_launchers = [
             {
                 'framework': 'dlsdk',
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1004,8 +1092,8 @@ def test_both_launchers_are_not_filtered_by_the_same_framework(self, mocker):
             },
             {
                 'framework': 'dlsdk',
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1017,18 +1105,23 @@ def test_both_launchers_are_not_filtered_by_the_same_framework(self, mocker):
         args = copy.deepcopy(self.arguments)
         args.model_optimizer = None
         args.converted_models = None
+        args.extensions = None
+        args.bitstreams = None
         args.target_framework = 'dlsdk'
 
         config = ConfigReader.merge(args)[0]
 
-        launchers = config['models'][0]['launchers']
+        assert len(config['models']) == 2
+        assert len(config['models'][0]['launchers']) == 1
+        assert len(config['models'][1]['launchers']) == 1
+        launchers = [config['models'][0]['launchers'][0], config['models'][1]['launchers'][0]]
         assert launchers == config_launchers
 
     def test_launcher_is_filtered_by_another_framework(self, mocker):
         config_launchers = [{
             'framework': 'dlsdk',
-            'model': Path('/absolute_path'),
-            'weights': Path('/absolute_path'),
+            'model': Path('/absolute_path').absolute(),
+            'weights': Path('/absolute_path').absolute(),
             'adapter': 'classification',
             '_model_optimizer': self.arguments.model_optimizer,
             '_models_prefix': self.arguments.models
@@ -1050,8 +1143,8 @@ def test_both_launchers_are_filtered_by_another_framework(self, mocker):
         config_launchers = [
             {
                 'framework': 'dlsdk',
-                'model': '/absolute_path1',
-                'weights': '/absolute_path1',
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1059,8 +1152,8 @@ def test_both_launchers_are_filtered_by_another_framework(self, mocker):
             },
             {
                 'framework': 'dlsdk',
-                'model': '/absolute_path2',
-                'weights': '/absolute_path2',
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1085,8 +1178,8 @@ def test_only_appropriate_launcher_is_filtered_by_another_framework(self, mocker
         config_launchers = [
             {
                 'framework': 'dlsdk',
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1094,8 +1187,8 @@ def test_only_appropriate_launcher_is_filtered_by_another_framework(self, mocker
             },
             {
                 'framework': 'caffe',
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU'
             }
@@ -1118,8 +1211,8 @@ def test_only_appropriate_launcher_is_filtered_by_another_framework(self, mocker
     def test_launcher_is_not_filtered_by_the_same_device(self, mocker):
         config_launchers = [{
             'framework': 'dlsdk',
-            'model': Path('/absolute_path1'),
-            'weights': Path('/absolute_path1'),
+            'model': Path('/absolute_path1').absolute(),
+            'weights': Path('/absolute_path1').absolute(),
             'adapter': 'classification',
             'device': 'CPU',
             '_model_optimizer': self.arguments.model_optimizer,
@@ -1130,6 +1223,8 @@ def test_launcher_is_not_filtered_by_the_same_device(self, mocker):
         args = copy.deepcopy(self.arguments)
         args.model_optimizer = None
         args.converted_models = None
+        args.extensions = None
+        args.bitstreams = None
         args.target_devices = ['CPU']
 
         config = ConfigReader.merge(args)[0]
@@ -1141,8 +1236,8 @@ def test_both_launchers_are_not_filtered_by_the_same_device(self, mocker):
         config_launchers = [
             {
                 'framework': 'dlsdk',
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1150,8 +1245,8 @@ def test_both_launchers_are_not_filtered_by_the_same_device(self, mocker):
             },
             {
                 'framework': 'caffe',
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU'
             }
@@ -1160,18 +1255,23 @@ def test_both_launchers_are_not_filtered_by_the_same_device(self, mocker):
         mocker.patch(self.module + '._read_configs', return_value=(None, local_config))
         args = copy.deepcopy(self.arguments)
         args.converted_models = None
+        args.extensions = None
+        args.bitstreams = None
         args.target_devices = ['CPU']
 
         config = ConfigReader.merge(args)[0]
 
-        launchers = config['models'][0]['launchers']
+        assert len(config['models']) == 2
+        assert len(config['models'][0]['launchers']) == 1
+        assert len(config['models'][1]['launchers']) == 1
+        launchers = [config['models'][0]['launchers'][0], config['models'][1]['launchers'][0]]
         assert launchers == config_launchers
 
     def test_launcher_is_filtered_by_another_device(self, mocker):
         config_launchers = [{
             'framework': 'dlsdk',
-            'model': Path('/absolute_path1'),
-            'weights': Path('/absolute_path1'),
+            'model': Path('/absolute_path1').absolute(),
+            'weights': Path('/absolute_path1').absolute(),
             'adapter': 'classification',
             'device': 'CPU',
             '_model_optimizer': self.arguments.model_optimizer,
@@ -1192,8 +1292,8 @@ def test_both_launchers_are_filtered_by_another_device(self, mocker):
         config_launchers = [
             {
                 'framework': 'dlsdk',
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1201,8 +1301,8 @@ def test_both_launchers_are_filtered_by_another_device(self, mocker):
             },
             {
                 'framework': 'caffe',
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU'
             }
@@ -1225,8 +1325,8 @@ def test_only_appropriate_launcher_is_filtered_by_another_device(self, mocker):
         config_launchers = [
             {
                 'framework': 'dlsdk',
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1234,8 +1334,8 @@ def test_only_appropriate_launcher_is_filtered_by_another_device(self, mocker):
             },
             {
                 'framework': 'caffe',
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU'
             }
@@ -1256,8 +1356,8 @@ def test_only_appropriate_launcher_is_filtered_by_user_input_devices(self, mocke
         config_launchers = [
             {
                 'framework': 'dlsdk',
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1265,8 +1365,8 @@ def test_only_appropriate_launcher_is_filtered_by_user_input_devices(self, mocke
             },
             {
                 'framework': 'dlsdk',
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'HETERO:CPU,GPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1274,8 +1374,8 @@ def test_only_appropriate_launcher_is_filtered_by_user_input_devices(self, mocke
             },
             {
                 'framework': 'caffe',
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU',
             }
@@ -1285,26 +1385,31 @@ def test_only_appropriate_launcher_is_filtered_by_user_input_devices(self, mocke
         mocker.patch(self.module + '._read_configs', return_value=(None, local_config))
         args = copy.deepcopy(self.arguments)
         args.converted_models = None
+        args.extensions = None
+        args.bitstreams = None
         args.target_devices = ['GPU', 'CPU']
 
         config = ConfigReader.merge(args)[0]
 
-        launchers = config['models'][0]['launchers']
+        assert len(config['models']) == 2
+        assert len(config['models'][0]['launchers']) == 1
+        assert len(config['models'][1]['launchers']) == 1
+        launchers = [config['models'][0]['launchers'][0], config['models'][1]['launchers'][0]]
         assert launchers == [config_launchers[0], config_launchers[2]]
 
     def test_both_launchers_are_filtered_by_other_devices(self, mocker):
         config_launchers = [
             {
                 'framework': 'dlsdk',
-                'model': '/absolute_path1',
-                'weights': '/absolute_path1',
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
             },
             {
                 'framework': 'caffe',
-                'model': '/absolute_path2',
-                'weights': '/absolute_path2',
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU'
             }
@@ -1326,8 +1431,8 @@ def test_both_launchers_are_not_filtered_by_same_devices(self, mocker):
         config_launchers = [
             {
                 'framework': 'dlsdk',
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1335,8 +1440,8 @@ def test_both_launchers_are_not_filtered_by_same_devices(self, mocker):
             },
             {
                 'framework': 'caffe',
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU'
             }
@@ -1345,19 +1450,24 @@ def test_both_launchers_are_not_filtered_by_same_devices(self, mocker):
         mocker.patch(self.module + '._read_configs', return_value=(None, local_config))
         args = copy.deepcopy(self.arguments)
         args.converted_models = None
+        args.extensions = None
+        args.bitstreams = None
         args.target_devices = ['GPU', 'CPU']
 
         config = ConfigReader.merge(args)[0]
 
-        launchers = config['models'][0]['launchers']
+        assert len(config['models']) == 2
+        assert len(config['models'][0]['launchers']) == 1
+        assert len(config['models'][1]['launchers']) == 1
+        launchers = [config['models'][0]['launchers'][0], config['models'][1]['launchers'][0]]
         assert launchers == config_launchers
 
     def test_launcher_is_not_filtered_by_device_with_tail(self, mocker):
         config_launchers = [
             {
                 'framework': 'dlsdk',
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1365,8 +1475,8 @@ def test_launcher_is_not_filtered_by_device_with_tail(self, mocker):
             },
             {
                 'framework': 'caffe',
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'GPU'
             }
@@ -1375,6 +1485,8 @@ def test_launcher_is_not_filtered_by_device_with_tail(self, mocker):
         mocker.patch(self.module + '._read_configs', return_value=(None, local_config))
         args = copy.deepcopy(self.arguments)
         args.converted_models = None
+        args.extensions = None
+        args.bitstreams = None
         args.target_devices = ['CPU', 'GPU_unexpected_tail']
 
         config = ConfigReader.merge(args)[0]
@@ -1387,8 +1499,8 @@ def test_all_model_launchers_filtered_in_config_with_several_models(self, mocker
         model1_launchers = [
             {
                 'framework': 'dlsdk',
-                'model': Path('/absolute_path1'),
-                'weights': Path('/absolute_path1'),
+                'model': Path('/absolute_path1').absolute(),
+                'weights': Path('/absolute_path1').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU',
                 '_model_optimizer': self.arguments.model_optimizer,
@@ -1396,8 +1508,8 @@ def test_all_model_launchers_filtered_in_config_with_several_models(self, mocker
             },
             {
                 'framework': 'caffe',
-                'model': Path('/absolute_path2'),
-                'weights': Path('/absolute_path2'),
+                'model': Path('/absolute_path2').absolute(),
+                'weights': Path('/absolute_path2').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU'
             }
@@ -1405,7 +1517,7 @@ def test_all_model_launchers_filtered_in_config_with_several_models(self, mocker
         model2_launchers = [
             {
                 'framework': 'tf',
-                'model': Path('/absolute_path3'),
+                'model': Path('/absolute_path3').absolute(),
                 'adapter': 'classification',
                 'device': 'CPU'
             }
@@ -1430,8 +1542,8 @@ def test_replace_empty_device_by_target_in_models_mode(self, mocker):
                 'name': 'model',
                 'launchers': [{
                     'framework': 'caffe',
-                    'model': Path('/absolute_path2'),
-                    'weights': Path('/absolute_path2'),
+                    'model': Path('/absolute_path2').absolute(),
+                    'weights': Path('/absolute_path2').absolute(),
                     'adapter': 'classification',
             }],
                 'datasets': [{'name': 'dataset'}]}]
@@ -1451,8 +1563,8 @@ def test_replace_empty_device_by_several_targets_in_models_mode(self, mocker):
                 'name': 'model',
                 'launchers': [{
                     'framework': 'caffe',
-                    'model': Path('/absolute_path2'),
-                    'weights': Path('/absolute_path2'),
+                    'model': Path('/absolute_path2').absolute(),
+                    'weights': Path('/absolute_path2').absolute(),
                     'adapter': 'classification',
             }],
                 'datasets': [{'name': 'dataset'}]}]
@@ -1461,8 +1573,10 @@ def test_replace_empty_device_by_several_targets_in_models_mode(self, mocker):
         args = copy.deepcopy(self.arguments)
         args.target_devices = ['CPU', 'GPU']
         config, _ = ConfigReader.merge(args)
-        launchers = config['models'][0]['launchers']
-        assert len(launchers) == 2
+        assert len(config['models']) == 2
+        assert len(config['models'][0]['launchers']) == 1
+        assert len(config['models'][1]['launchers']) == 1
+        launchers = [config['models'][0]['launchers'][0], config['models'][1]['launchers'][0]]
         assert 'device' in launchers[0]
         assert 'device' in launchers[1]
         assert launchers[0]['device'].upper() == 'CPU'
diff --git a/tools/accuracy_checker/tests/test_dataset.py b/tools/accuracy_checker/tests/test_dataset.py
index 8299260ddcd..f48a48b89e0 100644
--- a/tools/accuracy_checker/tests/test_dataset.py
+++ b/tools/accuracy_checker/tests/test_dataset.py
@@ -182,6 +182,114 @@ def test_annoation_conversion_subset_more_than_dataset_size(self, mocker):
             annotation = dataset.annotation
             assert annotation == converted_annotation
 
+    def test_annotation_conversion_with_zero_subset_size(self, mocker):
+        addition_options = {
+            'annotation_conversion': {'converter': 'wider', 'annotation_file': Path('file')},
+            'subsample_size': 0
+        }
+        config = copy_dataset_config(self.dataset_config)
+        config.update(addition_options)
+        converted_annotation = make_representation(['0 0 0 5 5', '0 1 1 10 10'], True)
+        mocker.patch(
+            'accuracy_checker.annotation_converters.WiderFormatConverter.convert',
+            return_value=ConverterReturn(converted_annotation, None, None)
+        )
+        with pytest.raises(ConfigError):
+            Dataset(config)
+
+    def test_annotation_conversion_with_negative_subset_size(self, mocker):
+        addition_options = {
+            'annotation_conversion': {'converter': 'wider', 'annotation_file': Path('file')},
+            'subsample_size': -1
+        }
+        config = copy_dataset_config(self.dataset_config)
+        config.update(addition_options)
+        converted_annotation = make_representation(['0 0 0 5 5', '0 1 1 10 10'], True)
+        mocker.patch(
+            'accuracy_checker.annotation_converters.WiderFormatConverter.convert',
+            return_value=ConverterReturn(converted_annotation, None, None)
+        )
+        with pytest.raises(ConfigError):
+            Dataset(config)
+
+    def test_annotation_conversion_negative_subset_ratio_raise_config_error(self, mocker):
+        addition_options = {
+            'annotation_conversion': {'converter': 'wider', 'annotation_file': Path('file')},
+            'subsample_size': '-50%'
+        }
+        config = copy_dataset_config(self.dataset_config)
+        config.update(addition_options)
+        converted_annotation = make_representation(['0 0 0 5 5', '0 1 1 10 10'], True)
+        mocker.patch(
+            'accuracy_checker.annotation_converters.WiderFormatConverter.convert',
+            return_value=ConverterReturn(converted_annotation, None, None)
+        )
+        with pytest.raises(ConfigError):
+            Dataset(config)
+
+    def test_annotation_conversion_zero_subset_ratio_raise_config_error(self, mocker):
+        addition_options = {
+            'annotation_conversion': {'converter': 'wider', 'annotation_file': Path('file')},
+            'subsample_size': '0%'
+        }
+        config = copy_dataset_config(self.dataset_config)
+        config.update(addition_options)
+        converted_annotation = make_representation(['0 0 0 5 5', '0 1 1 10 10'], True)
+        mocker.patch(
+            'accuracy_checker.annotation_converters.WiderFormatConverter.convert',
+            return_value=ConverterReturn(converted_annotation, None, None)
+        )
+        with pytest.raises(ConfigError):
+            Dataset(config)
+
+    def test_annotation_conversion_invalid_subset_ratio_raise_config_error(self, mocker):
+        addition_options = {
+            'annotation_conversion': {'converter': 'wider', 'annotation_file': Path('file')},
+            'subsample_size': 'aaa%'
+        }
+        config = copy_dataset_config(self.dataset_config)
+        config.update(addition_options)
+        converted_annotation = make_representation(['0 0 0 5 5', '0 1 1 10 10'], True)
+        mocker.patch(
+            'accuracy_checker.annotation_converters.WiderFormatConverter.convert',
+            return_value=ConverterReturn(converted_annotation, None, None)
+        )
+        with pytest.raises(ConfigError):
+            Dataset(config)
+
+    def test_annotation_conversion_invalid_subset_size_raise_config_error(self, mocker):
+        addition_options = {
+            'annotation_conversion': {'converter': 'wider', 'annotation_file': Path('file')},
+            'subsample_size': 'aaa'
+        }
+        config = copy_dataset_config(self.dataset_config)
+        config.update(addition_options)
+        converted_annotation = make_representation(['0 0 0 5 5', '0 1 1 10 10'], True)
+        mocker.patch(
+            'accuracy_checker.annotation_converters.WiderFormatConverter.convert',
+            return_value=ConverterReturn(converted_annotation, None, None)
+        )
+        with pytest.raises(ConfigError):
+            Dataset(config)
+
+    def test_annotation_conversion_closer_to_zero_subset_ratio(self, mocker):
+        addition_options = {
+            'annotation_conversion': {'converter': 'wider', 'annotation_file': Path('file')},
+            'subsample_size': '0.001%'
+        }
+        config = copy_dataset_config(self.dataset_config)
+        config.update(addition_options)
+        converted_annotation = make_representation(['0 0 0 5 5', '0 1 1 10 10'], True)
+        mocker.patch(
+            'accuracy_checker.annotation_converters.WiderFormatConverter.convert',
+            return_value=ConverterReturn(converted_annotation, None, None)
+        )
+        subset_maker_mock = mocker.patch(
+            'accuracy_checker.dataset.make_subset'
+        )
+        Dataset(config)
+        subset_maker_mock.assert_called_once_with(converted_annotation, 1, 666)
+
     def test_annotation_conversion_subset_with_seed(self, mocker):
         addition_options = {
             'annotation_conversion': {'converter': 'wider', 'annotation_file': Path('file')},
diff --git a/tools/accuracy_checker/tests/test_dlsdk_launcher.py b/tools/accuracy_checker/tests/test_dlsdk_launcher.py
index 899973030ee..b451c604f30 100644
--- a/tools/accuracy_checker/tests/test_dlsdk_launcher.py
+++ b/tools/accuracy_checker/tests/test_dlsdk_launcher.py
@@ -34,14 +34,6 @@
 from accuracy_checker.data_readers import DataRepresentation
 from accuracy_checker.utils import contains_all
 
-def check_no_gpu():
-    try:
-        import openvino.inference_engine as ie
-        gpu_plugin = ie.IEPlugin('GPU')
-        del gpu_plugin
-        return False
-    except (ImportError, RuntimeError):
-        return True
 
 @pytest.fixture()
 def mock_inference_engine(mocker):
@@ -107,7 +99,7 @@ def test_dlsd_launcher_set_batch_size(self, models_dir):
         dlsdk_test_model = get_dlsdk_test_model(models_dir, {'batch': 2})
         assert dlsdk_test_model.batch == 2
 
-@pytest.mark.skipif(check_no_gpu(), reason="GPU is not installed")
+
 @pytest.mark.usefixtures('mock_path_exists')
 class TestDLSDKLauncherAffinity:
     def test_dlsdk_launcher_valid_affinity_map(self, mocker, models_dir):
@@ -117,7 +109,7 @@ def test_dlsdk_launcher_valid_affinity_map(self, mocker, models_dir):
             'accuracy_checker.launcher.dlsdk_launcher.read_yaml', return_value=affinity_map
         )
 
-        dlsdk_test_model = get_dlsdk_test_model(models_dir, {'device' : 'HETERO:CPU,GPU', 'affinity_map': './affinity_map.yml'})
+        dlsdk_test_model = get_dlsdk_test_model(models_dir, {'device' : 'HETERO:CPU,GPU', 'affinity_map' : './affinity_map.yml'})
         layers = dlsdk_test_model.network.layers
         for key, value in affinity_map.items():
             assert layers[key].affinity == value
@@ -144,75 +136,7 @@ def test_dlsdk_launcher_affinity_map_invalid_layer(self, mocker, models_dir):
 
 
 @pytest.mark.usefixtures('mock_path_exists', 'mock_inference_engine', 'mock_inputs')
-class TestDLSDKLauncherMultiDevice:
-    def test_multi_device_launcher_creation(self):
-        launcher_config = {
-            'framework': 'dlsdk', 'model': 'custom', 'weights': 'custom', 'device': 'MULTI:CPU,GPU', 'async_mode': True
-        }
-        launcher = create_launcher(launcher_config)
-        assert launcher.async_mode
-        assert launcher.num_requests == 4
-
-    def test_multi_device_launcher_creation_with_num_requests_as_one_value(self):
-        launcher_config = {
-            'framework': 'dlsdk', 'model': 'custom', 'weights': 'custom', 'device': 'MULTI:CPU,GPU', 'async_mode': True,
-            'num_requests': 2
-        }
-        launcher = create_launcher(launcher_config)
-        assert launcher.async_mode
-        assert launcher.num_requests == 8
-
-    def test_multi_device_launcher_creation_with_num_requests_as_list(self):
-        launcher_config = {
-            'framework': 'dlsdk', 'model': 'custom', 'weights': 'custom', 'device': 'MULTI:CPU,GPU', 'async_mode': True,
-            'num_requests': '1,2'
-        }
-        launcher = create_launcher(launcher_config)
-        assert launcher.async_mode
-        assert launcher.num_requests == 6
-
-    def test_multi_device_launcher_creation_with_num_requests_not_for_all_devices_raise_error(self):
-        launcher_config_1 = {
-            'framework': 'dlsdk', 'model': 'custom', 'weights': 'custom', 'device': 'MULTI:CPU,GPU,FPGA',
-            'async_mode': True,
-            'num_requests': '1,2'
-        }
-        launcher_config_2 = {
-            'framework': 'dlsdk', 'model': 'custom', 'weights': 'custom', 'device': 'MULTI:CPU(1),GPU(2),FPGA',
-            'async_mode': True,
-        }
-        with pytest.raises(ConfigError):
-            create_launcher(launcher_config_1)
-
-        with pytest.raises(ConfigError):
-            create_launcher(launcher_config_2)
-
-    def test_multi_device_launcher_creation_warn_if_not_async_mode(self):
-        launcher_config = {
-            'framework': 'dlsdk', 'model': 'custom', 'weights': 'custom', 'device': 'MULTI:CPU,GPU'
-        }
-        with pytest.warns(None) as warnings:
-            launcher = create_launcher(launcher_config)
-            assert len(warnings) == 1
-            assert warnings[0].message.args[0] == 'Using multi device in sync mode non-applicable. Async mode will be used.'
-            assert launcher.async_mode
-            assert launcher.num_requests == 4
-
-    def test_multi_device_launcher_creation_warn_if_num_requests_in_device_string_and_confid_field_both_provided(self):
-        launcher_config = {
-            'framework': 'dlsdk', 'model': 'custom', 'weights': 'custom', 'device': 'MULTI:CPU(2),GPU(3)',
-            'async_mode': True, 'num_requests': 2
-        }
-        with pytest.warns(None) as warnings:
-            launcher = create_launcher(launcher_config)
-            assert len(warnings) == 1
-            assert warnings[0].message.args[0] == "number requests already provided in device name specification. 'num_requests' option will be ignored."
-            assert launcher.async_mode
-            assert launcher.num_requests == 10
-
-
-@pytest.mark.usefixtures('mock_path_exists', 'mock_inference_engine', 'mock_inputs')
-class TestDLSDKLauncherBitstreamProgramming:
+class TestDLSDKLauncher:
     def test_program_bitsream_when_device_is_fpga(self, mocker):
         subprocess_mock = mocker.patch('subprocess.run')
         config = {
@@ -409,9 +333,6 @@ def test_does_not_set_dla_aocx_if_compiler_mode_3_in_env_when_fpga_in_device(sel
 
         os.environ.__setitem__.assert_not_called()
 
-
-@pytest.mark.usefixtures('mock_path_exists', 'mock_inference_engine', 'mock_inputs')
-class TestDLSDKLauncherModels:
     def test_model_converted_from_caffe(self, mocker):
         mock = mocker.patch(
             'accuracy_checker.launcher.dlsdk_launcher.convert_model',
@@ -433,7 +354,7 @@ def test_model_converted_from_caffe(self, mocker):
         mock.assert_called_once_with(
             'custom_model', '/path/to/source_models/custom_model', '/path/to/source_models/custom_weights', '',
             FrameworkParameters('caffe', False),
-            [], None, None, None, None, should_log_cmd=False
+            [], None, None, None, None, None, should_log_cmd=False
         )
 
     def test_model_converted_with_mo_params(self, mocker):
@@ -458,7 +379,7 @@ def test_model_converted_with_mo_params(self, mocker):
         mock.assert_called_once_with(
             'custom_model', '/path/to/source_models/custom_model', '/path/to/source_models/custom_weights', '',
             FrameworkParameters('caffe', False),
-            [], {'data_type': 'FP16'}, None, None, None, should_log_cmd=False
+            [], {'data_type': 'FP16'}, None, None, None, None, should_log_cmd=False
         )
 
     def test_model_converted_with_mo_flags(self, mocker):
@@ -484,7 +405,7 @@ def test_model_converted_with_mo_flags(self, mocker):
         mock.assert_called_once_with(
             'custom_model', '/path/to/source_models/custom_model', '/path/to/source_models/custom_weights', '',
             FrameworkParameters('caffe', False),
-            [], None, ['reverse_input_channels'], None, None, should_log_cmd=False
+            [], None, ['reverse_input_channels'], None, None, None, should_log_cmd=False
         )
 
     def test_model_converted_to_output_dir_in_mo_params(self, mocker):
@@ -530,7 +451,7 @@ def test_model_converted_from_tf(self, mocker):
 
         mock.assert_called_once_with(
             'custom_model', '/path/to/source_models/custom_model', '', '',
-            FrameworkParameters('tf', False), [], None, None, None, None,
+            FrameworkParameters('tf', False), [], None, None, None, None, None,
             should_log_cmd=False
         )
 
@@ -552,7 +473,7 @@ def test_model_converted_from_tf_checkpoint(self, mocker):
 
         mock.assert_called_once_with(
             'custom_model', '', '', '/path/to/source_models/custom_model',
-            FrameworkParameters('tf', True), [], None, None, None, None,
+            FrameworkParameters('tf', True), [], None, None, None, None, None,
             should_log_cmd=False
         )
 
@@ -570,10 +491,10 @@ def test_model_converted_from_tf_with_arg_path_to_custom_tf_config(self, mocker)
         prepare_args_patch = mocker.patch('accuracy_checker.launcher.model_conversion.prepare_args')
 
         args = {
-            'input_model': '/path/to/source_models/custom_model',
+            'input_model': str(Path('/path/to/source_models/custom_model')),
             'model_name': 'custom_model',
             'framework': 'tf',
-            'tensorflow_use_custom_operations_config': 'config/dir/ssd_v2_support.json'
+            'tensorflow_use_custom_operations_config': str(Path('config/dir/ssd_v2_support.json'))
         }
 
         mocker.patch(
@@ -581,7 +502,8 @@ def test_model_converted_from_tf_with_arg_path_to_custom_tf_config(self, mocker)
             return_value=subprocess.CompletedProcess(args, returncode=0)
         )
         DLSDKLauncher(config)
-        prepare_args_patch.assert_called_once_with('/path/ModelOptimizer', flag_options=[], value_options=args)
+        mo_path = str(Path('/path/ModelOptimizer'))
+        prepare_args_patch.assert_called_once_with(mo_path, flag_options=[], value_options=args)
 
     def test_model_converted_from_tf_with_default_path_to_custom_tf_config(self, mocker):
         config = {
@@ -596,10 +518,10 @@ def test_model_converted_from_tf_with_default_path_to_custom_tf_config(self, moc
         prepare_args_patch = mocker.patch('accuracy_checker.launcher.model_conversion.prepare_args')
 
         args = {
-            'input_model': '/path/to/source_models/custom_model',
+            'input_model': str(Path('/path/to/source_models/custom_model')),
             'model_name': 'custom_model',
             'framework': 'tf',
-            'tensorflow_use_custom_operations_config': '/path/extensions/front/tf/config.json'
+            'tensorflow_use_custom_operations_config': str(Path('/path/extensions/front/tf/config.json'))
         }
 
         mocker.patch(
@@ -607,7 +529,7 @@ def test_model_converted_from_tf_with_default_path_to_custom_tf_config(self, moc
             return_value=subprocess.CompletedProcess(args, returncode=0)
         )
         DLSDKLauncher(config)
-        prepare_args_patch.assert_called_once_with('/path/ModelOptimizer', flag_options=[], value_options=args)
+        prepare_args_patch.assert_called_once_with(str(Path('/path/ModelOptimizer')), flag_options=[], value_options=args)
 
     def test_model_converted_from_tf_with_default_path_to_obj_detection_api_config(self, mocker):
         config = {
@@ -623,10 +545,10 @@ def test_model_converted_from_tf_with_default_path_to_obj_detection_api_config(s
         prepare_args_patch = mocker.patch('accuracy_checker.launcher.model_conversion.prepare_args')
 
         args = {
-            'input_model': '/path/to/source_models/custom_model',
+            'input_model': str(Path('/path/to/source_models/custom_model')),
             'model_name': 'custom_model',
             'framework': 'tf',
-            'tensorflow_object_detection_api_pipeline_config': '/path/to/source_models/operations.config'
+            'tensorflow_object_detection_api_pipeline_config': str(Path('/path/to/source_models/operations.config'))
         }
 
         mocker.patch(
@@ -634,7 +556,7 @@ def test_model_converted_from_tf_with_default_path_to_obj_detection_api_config(s
             return_value=subprocess.CompletedProcess(args, returncode=0)
         )
         DLSDKLauncher(config)
-        prepare_args_patch.assert_called_once_with('/path/ModelOptimizer', flag_options=[], value_options=args)
+        prepare_args_patch.assert_called_once_with(str(Path('/path/ModelOptimizer')), flag_options=[], value_options=args)
 
     def test_model_converted_from_tf_with_arg_path_to_obj_detection_api_config(self, mocker):
         config = {
@@ -644,17 +566,16 @@ def test_model_converted_from_tf_with_arg_path_to_obj_detection_api_config(self,
             '_models_prefix': '/path/to',
             'adapter': 'classification',
             'mo_params': {'tensorflow_object_detection_api_pipeline_config': 'operations.config'},
-            '_tf_custom_op_config_dir': 'config/dir',
             '_tf_obj_detection_api_pipeline_config_path': 'od_api'
         }
         mocker.patch('accuracy_checker.launcher.model_conversion.find_mo', return_value=Path('/path/ModelOptimizer'))
         prepare_args_patch = mocker.patch('accuracy_checker.launcher.model_conversion.prepare_args')
 
         args = {
-            'input_model': '/path/to/source_models/custom_model',
+            'input_model': str(Path('/path/to/source_models/custom_model')),
             'model_name': 'custom_model',
             'framework': 'tf',
-            'tensorflow_object_detection_api_pipeline_config': 'od_api/operations.config'
+            'tensorflow_object_detection_api_pipeline_config': str(Path('od_api/operations.config'))
         }
 
         mocker.patch(
@@ -704,10 +625,10 @@ def test_model_converted_from_tf_checkpoint_with_default_path_to_custom_tf_confi
         prepare_args_patch = mocker.patch('accuracy_checker.launcher.model_conversion.prepare_args')
 
         args = {
-            'input_meta_graph': '/path/to/source_models/custom_model',
+            'input_meta_graph': str(Path('/path/to/source_models/custom_model')),
             'model_name': 'custom_model',
             'framework': 'tf',
-            'tensorflow_use_custom_operations_config': '/path/extensions/front/tf/config.json'
+            'tensorflow_use_custom_operations_config': str(Path('/path/extensions/front/tf/config.json'))
         }
 
         mocker.patch(
@@ -731,10 +652,10 @@ def test_model_converted_from_tf_checkpoint_with_default_path_to_obj_detection_a
         prepare_args_patch = mocker.patch('accuracy_checker.launcher.model_conversion.prepare_args')
 
         args = {
-            'input_meta_graph': '/path/to/source_models/custom_model',
+            'input_meta_graph': str(Path('/path/to/source_models/custom_model')),
             'model_name': 'custom_model',
             'framework': 'tf',
-            'tensorflow_object_detection_api_pipeline_config': '/path/to/source_models/operations.config'
+            'tensorflow_object_detection_api_pipeline_config': str(Path('/path/to/source_models/operations.config'))
         }
 
         mocker.patch(
@@ -759,10 +680,10 @@ def test_model_converted_from_tf_checkpoint_with_arg_path_to_obj_detection_api_c
         prepare_args_patch = mocker.patch('accuracy_checker.launcher.model_conversion.prepare_args')
 
         args = {
-            'input_meta_graph': '/path/to/source_models/custom_model',
+            'input_meta_graph': str(Path('/path/to/source_models/custom_model')),
             'model_name': 'custom_model',
             'framework': 'tf',
-            'tensorflow_object_detection_api_pipeline_config': 'od_api/operations.config'
+            'tensorflow_object_detection_api_pipeline_config': str(Path('od_api/operations.config'))
         }
 
         mocker.patch(
@@ -770,7 +691,60 @@ def test_model_converted_from_tf_checkpoint_with_arg_path_to_obj_detection_api_c
             return_value=subprocess.CompletedProcess(args, returncode=0)
         )
         DLSDKLauncher(config)
-        prepare_args_patch.assert_called_once_with('/path/ModelOptimizer', flag_options=[], value_options=args)
+        prepare_args_patch.assert_called_once_with(str(Path('/path/ModelOptimizer')), flag_options=[], value_options=args)
+
+    def test_model_converted_from_tf_checkpoint_with_arg_path_to_transformations_config(self, mocker):
+        """A bare 'transformations_config' name is expected to be joined onto '_transformations_config_dir'."""
+        launcher_config = {
+            'framework': 'dlsdk',
+            'tf_meta': '/path/to/source_models/custom_model',
+            'device': 'cpu',
+            '_models_prefix': '/path/to',
+            'adapter': 'classification',
+            'mo_params': {'transformations_config': 'ssd_v2_support.json'},
+            '_transformations_config_dir': 'config/dir'
+        }
+        expected_options = {
+            'input_meta_graph': str(Path('/path/to/source_models/custom_model')),
+            'model_name': 'custom_model',
+            'framework': 'tf',
+            'transformations_config': str(Path('config/dir/ssd_v2_support.json'))
+        }
+        mo_path = Path('/path/ModelOptimizer')
+        mocker.patch('accuracy_checker.launcher.model_conversion.find_mo', return_value=mo_path)
+        prepare_args_mock = mocker.patch('accuracy_checker.launcher.model_conversion.prepare_args')
+        mocker.patch(
+            'accuracy_checker.launcher.model_conversion.exec_mo_binary',
+            return_value=subprocess.CompletedProcess(expected_options, returncode=0)
+        )
+        DLSDKLauncher(launcher_config)
+        prepare_args_mock.assert_called_once_with(str(mo_path), flag_options=[], value_options=expected_options)
+
+    def test_model_converted_from_tf_checkpoint_with_default_path_to_transformations_config(self, mocker):
+        """Without a configured directory, the config is expected to resolve under '/path/extensions/front/tf'."""
+        launcher_config = {
+            'framework': 'dlsdk',
+            'tf_meta': '/path/to/source_models/custom_model',
+            'device': 'cpu',
+            '_models_prefix': '/path/to',
+            'adapter': 'classification',
+            'mo_params': {'transformations_config': 'config.json'}
+        }
+        expected_options = {
+            'input_meta_graph': str(Path('/path/to/source_models/custom_model')),
+            'model_name': 'custom_model',
+            'framework': 'tf',
+            'transformations_config': str(Path('/path/extensions/front/tf/config.json'))
+        }
+        mo_path = Path('/path/ModelOptimizer')
+        mocker.patch('accuracy_checker.launcher.model_conversion.find_mo', return_value=mo_path)
+        prepare_args_mock = mocker.patch('accuracy_checker.launcher.model_conversion.prepare_args')
+        mocker.patch(
+            'accuracy_checker.launcher.model_conversion.exec_mo_binary',
+            return_value=subprocess.CompletedProcess(expected_options, returncode=0)
+        )
+        DLSDKLauncher(launcher_config)
+        prepare_args_mock.assert_called_once_with(str(mo_path), flag_options=[], value_options=expected_options)
 
     def test_model_converted_from_mxnet(self, mocker):
         mock = mocker.patch(
@@ -790,7 +764,7 @@ def test_model_converted_from_mxnet(self, mocker):
 
         mock.assert_called_once_with(
             'custom_weights', '', '/path/to/source_models/custom_weights', '',
-            FrameworkParameters('mxnet', False), [], None, None, None, None,
+            FrameworkParameters('mxnet', False), [], None, None, None, None, None,
             should_log_cmd=False
         )
 
@@ -812,7 +786,7 @@ def test_model_converted_from_onnx(self, mocker):
 
         mock.assert_called_once_with(
             'custom_model', '/path/to/source_models/custom_model', '', '',
-            FrameworkParameters('onnx', False), [], None, None, None, None,
+            FrameworkParameters('onnx', False), [], None, None, None, None, None,
             should_log_cmd=False
         )
 
@@ -834,7 +808,7 @@ def test_model_converted_from_kaldi(self, mocker):
 
         mock.assert_called_once_with(
             'custom_model', '/path/to/source_models/custom_model', '', '',
-            FrameworkParameters('kaldi', False), [], None, None, None, None,
+            FrameworkParameters('kaldi', False), [], None, None, None, None, None,
             should_log_cmd=False
         )
 
@@ -1127,46 +1101,6 @@ def test_hetero_endswith_comma(self):
         with pytest.raises(ConfigError):
             self.config.validate(update_dict(self.launcher, device='HETERO:CPU,FPGA,'))
 
-    def test_multi_device_correct(self):
-        self.config.validate(update_dict(self.launcher, device='MULTI:CPU'))
-        self.config.validate(update_dict(self.launcher, device='MULTI:CPU,FPGA'))
-        self.config.validate(update_dict(self.launcher, device='MULTI:CPU(1),FPGA(2)'))
-
-    def test_multi_device_endswith_comma(self):
-        with pytest.raises(ConfigError):
-            self.config.validate(update_dict(self.launcher, device='MULTI:CPU,FPGA,'))
-
-    def test_multi_device_empty_brackets(self):
-        with pytest.raises(ConfigError):
-            self.config.validate(update_dict(self.launcher, device='MULTI:CPU,FPGA()'))
-
-    def test_multi_device_n_requests_without_brackets(self):
-        with pytest.raises(ConfigError):
-            self.config.validate(update_dict(self.launcher, device='MULTI:CPU(42),FPGA666'))
-
-        with pytest.raises(ConfigError):
-            self.config.validate(update_dict(self.launcher, device='MULTI:CPU42,FPGA(666)'))
-
-        with pytest.raises(ConfigError):
-            self.config.validate(update_dict(self.launcher, device='MULTI:CPU42,FPGA666'))
-
-    def test_multi_device_missed_bracket(self):
-        with pytest.raises(ConfigError):
-            self.config.validate(update_dict(self.launcher, device='MULTI:CPU(42,FPGA(666)'))
-
-        with pytest.raises(ConfigError):
-            self.config.validate(update_dict(self.launcher, device='MULTI:CPU(42),FPGA666)'))
-
-        with pytest.raises(ConfigError):
-            self.config.validate(update_dict(self.launcher, device='MULTI:CPU42),FPGA(666)'))
-
-        with pytest.raises(ConfigError):
-            self.config.validate(update_dict(self.launcher, device='MULTI:CPU(42),FPGA(666'))
-
-    def test_multi_device_empty(self):
-        with pytest.raises(ConfigError):
-            self.config.validate(update_dict(self.launcher, device='MULTI:'))
-
     def test_normal_multiple_devices(self):
         with pytest.raises(ConfigError):
             self.config.validate(update_dict(self.launcher, device='CPU,FPGA'))
@@ -1202,19 +1136,19 @@ def test_undefined_str_adapter_in_create_dlsdk_launcher_raises_config_error_exce
         with pytest.raises(ConfigError):
             create_launcher(launcher_config)
 
-    def test_empty_dict_adapter_in_create_dlsdk_launcher_raises_config_error_exception(self):
+    def test_empty_dict_adapter_in_create_dlsdk_launcher_raises_config_error_exception(self):
         launcher_config = {'framework': 'dlsdk', 'model': 'custom', 'weights': 'custom', 'adapter': {}}
 
         with pytest.raises(ConfigError):
             create_launcher(launcher_config)
 
-    def test_missed_type_in_dict_adapter_in_create_dlsdk_launcher_raises_config_error_exception(self):
+    def test_missed_type_in_dict_adapter_in_create_dlsdk_launcher_raises_config_error_exception(self):
         launcher_config = {'framework': 'dlsdk', 'model': 'custom', 'weights': 'custom', 'adapter': {'key': 'val'}}
 
         with pytest.raises(ConfigError):
             create_launcher(launcher_config)
 
-    def test_undefined_type_in_dict_adapter_in_create_dlsdk_launcher_raises_config_error_exception(self):
+    def test_undefined_type_in_dict_adapter_in_create_dlsdk_launcher_raises_config_error_exception(self):
         launcher_config = {
             'framework': 'dlsdk',
             'model': 'custom',
@@ -1247,3 +1181,7 @@ def test_dlsdk_launcher_model_no_image_inputs_raise_value_error(self):
 
         with pytest.raises(ValueError):
             create_launcher(launcher_config)
+
+
+def dummy_adapter():
+    """No-op placeholder: takes no arguments and implicitly returns None."""
diff --git a/tools/accuracy_checker/tests/test_input_feeder.py b/tools/accuracy_checker/tests/test_input_feeder.py
index 013896bb1ff..ebba6d5730e 100644
--- a/tools/accuracy_checker/tests/test_input_feeder.py
+++ b/tools/accuracy_checker/tests/test_input_feeder.py
@@ -273,3 +273,56 @@ def test_fill_non_const_input_with_multi_infer_not_consistent_data_batch_2(self)
         assert len(result) == len(expected)
         assert np.array_equal(result[0]['input'], expected[0]['input'])
         assert np.array_equal(result[1]['input'], expected[1]['input'])
+
+    def test_set_input_precision_for_constant_input(self):
+        """A CONST_INPUT declared with precision 'U8' is expected to be stored with dtype uint8."""
+        const_config = [{'name': 'input_u8', 'type': 'CONST_INPUT', 'value': [1, 2, 3], 'precision': 'U8'}]
+        feeder = InputFeeder(const_config, {'input': (1, 3, 10, 10), 'input_u8': (3,)})
+        assert feeder.const_inputs['input_u8'].dtype == np.uint8
+
+    def test_set_invalid_input_precision_for_constant_input_raise_config_error(self):
+        """Precision 'U2' on a CONST_INPUT is expected to make InputFeeder raise ConfigError."""
+        bad_config = [{'name': 'input_u8', 'type': 'CONST_INPUT', 'value': [1, 2, 3], 'precision': 'U2'}]
+        with pytest.raises(ConfigError):
+            InputFeeder(bad_config, {'input': (1, 3, 10, 10), 'input_u8': (3,)})
+
+    def test_set_input_precision_for_non_constant_input(self):
+        """An INPUT layer declared with precision 'U8' is expected to be filled with uint8 data."""
+        feeder = InputFeeder(
+            [{'name': 'input_u8', 'type': 'INPUT', 'precision': 'U8'}],
+            {'input_u8': (1, 3, 10, 10)}
+        )
+        # One all-zero 10x10x3 array with identifier '0' serves as the whole batch.
+        batch = [DataRepresentation(np.zeros((10, 10, 3)), identifier='0')]
+        result = feeder.fill_non_constant_inputs(batch)
+        expected = [{'input_u8': np.zeros((1, 3, 10, 10), dtype=np.uint8)}]
+        assert len(result) == len(expected)
+        filled = result[0]['input_u8']
+        assert np.array_equal(filled, expected[0]['input_u8'])
+        assert filled.dtype == expected[0]['input_u8'].dtype
+
+    def test_set_invalid_input_precision_for_non_constant_input_raise_config_error(self):
+        with pytest.raises(ConfigError):  # precision 'U2' on an INPUT layer is expected to be rejected
+            InputFeeder([{'name': 'input', 'type': 'INPUT', 'precision': 'U2'}], {'input': (1, 3, 10, 10)})
+
+    def test_set_input_precision_for_image_info_input(self):
+        """Precision 'U8' on IMAGE_INFO is expected to affect 'im_info' only; 'input' keeps the default dtype."""
+        feeder = InputFeeder(
+            [{'name': 'im_info', 'type': 'IMAGE_INFO', 'precision': 'U8'}],
+            {'input': (1, 3, 10, 10), 'im_info': (1, 3)}
+        )
+        # One all-zero 10x10x3 array with identifier '0' serves as the whole batch.
+        batch = [DataRepresentation(np.zeros((10, 10, 3)), identifier='0')]
+        result = feeder.fill_non_constant_inputs(batch)
+        expected = [{'input': np.zeros((1, 3, 10, 10)), 'im_info': np.array([[10, 10, 1]], dtype=np.uint8)}]
+        assert len(result) == len(expected)
+        # Both layers are checked for equal values first, then for equal dtype.
+        for layer_name in ('input', 'im_info'):
+            actual, wanted = result[0][layer_name], expected[0][layer_name]
+            assert np.array_equal(actual, wanted)
+            assert actual.dtype == wanted.dtype
+
+    def test_set_invalid_input_precision_for_image_info_input_raise_config_error(self):
+        bad_config = [{'name': 'im_info', 'type': 'IMAGE_INFO', 'precision': 'U2'}]  # 'U2' must be rejected
+        with pytest.raises(ConfigError):
+            InputFeeder(bad_config, {'input': (1, 3, 10, 10), 'im_info': (1, 3)})
diff --git a/tools/accuracy_checker/tests/test_metric_evaluator.py b/tools/accuracy_checker/tests/test_metric_evaluator.py
index fc0c4d28f85..44265aed89a 100644
--- a/tools/accuracy_checker/tests/test_metric_evaluator.py
+++ b/tools/accuracy_checker/tests/test_metric_evaluator.py
@@ -16,7 +16,7 @@
 
 import pytest
 from accuracy_checker.config import ConfigError
-from accuracy_checker.metrics import ClassificationAccuracy, MetricsExecutor
+from accuracy_checker.metrics import ClassificationAccuracy, MetricsExecutor, PerImageMetricResult
 from accuracy_checker.metrics.metric import Metric
 from accuracy_checker.representation import (
     ClassificationAnnotation,
@@ -70,7 +70,7 @@ def test_accuracy_on_container_with_wrong_annotation_source_name_raise_config_er
 
         dispatcher = MetricsExecutor([{'type': 'accuracy', 'top_k': 1, 'annotation_source': 'a'}], None)
         with pytest.raises(ConfigError):
-            dispatcher.update_metrics_on_batch(annotations, predictions)
+            dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
     def test_accuracy_with_wrong_annotation_type_raise_config_error_exception(self):
         annotations = [DetectionAnnotation('identifier', 3)]
@@ -78,7 +78,7 @@ def test_accuracy_with_wrong_annotation_type_raise_config_error_exception(self):
 
         dispatcher = MetricsExecutor([{'type': 'accuracy', 'top_k': 1}], None)
         with pytest.raises(ConfigError):
-            dispatcher.update_metrics_on_batch(annotations, predictions)
+            dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
     def test_accuracy_with_unsupported_annotations_in_container_raise_config_error_exception(self):
         annotations = [ContainerAnnotation({'annotation': DetectionAnnotation('identifier', 3)})]
@@ -86,7 +86,7 @@ def test_accuracy_with_unsupported_annotations_in_container_raise_config_error_e
 
         dispatcher = MetricsExecutor([{'type': 'accuracy', 'top_k': 1}], None)
         with pytest.raises(ConfigError):
-            dispatcher.update_metrics_on_batch(annotations, predictions)
+            dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
     def test_accuracy_with_unsupported_annotation_type_as_annotation_source_for_container_raises_config_error(self):
         annotations = [ContainerAnnotation({'annotation': DetectionAnnotation('identifier', 3)})]
@@ -94,7 +94,7 @@ def test_accuracy_with_unsupported_annotation_type_as_annotation_source_for_cont
 
         dispatcher = MetricsExecutor([{'type': 'accuracy', 'top_k': 1, 'annotation_source': 'annotation'}], None)
         with pytest.raises(ConfigError):
-            dispatcher.update_metrics_on_batch(annotations, predictions)
+            dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
     def test_accuracy_on_annotation_container_with_several_suitable_representations_config_value_error_exception(self):
         annotations = [ContainerAnnotation({
@@ -105,7 +105,7 @@ def test_accuracy_on_annotation_container_with_several_suitable_representations_
 
         dispatcher = MetricsExecutor([{'type': 'accuracy', 'top_k': 1}], None)
         with pytest.raises(ConfigError):
-            dispatcher.update_metrics_on_batch(annotations, predictions)
+            dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
     def test_accuracy_with_wrong_prediction_type_raise_config_error_exception(self):
         annotations = [ClassificationAnnotation('identifier', 3)]
@@ -113,7 +113,7 @@ def test_accuracy_with_wrong_prediction_type_raise_config_error_exception(self):
 
         dispatcher = MetricsExecutor([{'type': 'accuracy', 'top_k': 1}], None)
         with pytest.raises(ConfigError):
-            dispatcher.update_metrics_on_batch(annotations, predictions)
+            dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
     def test_accuracy_with_unsupported_prediction_in_container_raise_config_error_exception(self):
         annotations = [ClassificationAnnotation('identifier', 3)]
@@ -121,7 +121,7 @@ def test_accuracy_with_unsupported_prediction_in_container_raise_config_error_ex
 
         dispatcher = MetricsExecutor([{'type': 'accuracy', 'top_k': 1}], None)
         with pytest.raises(ConfigError):
-            dispatcher.update_metrics_on_batch(annotations, predictions)
+            dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
     def test_accuracy_with_unsupported_prediction_type_as_prediction_source_for_container_raises_config_error(self):
         annotations = [ClassificationAnnotation('identifier', 3)]
@@ -129,7 +129,7 @@ def test_accuracy_with_unsupported_prediction_type_as_prediction_source_for_cont
 
         dispatcher = MetricsExecutor([{'type': 'accuracy', 'top_k': 1, 'prediction_source': 'prediction'}], None)
         with pytest.raises(ConfigError):
-            dispatcher.update_metrics_on_batch(annotations, predictions)
+            dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
     def test_accuracy_on_prediction_container_with_several_suitable_representations_raise_config_error_exception(self):
         annotations = [ClassificationAnnotation('identifier', 3)]
@@ -140,14 +140,14 @@ def test_accuracy_on_prediction_container_with_several_suitable_representations_
 
         dispatcher = MetricsExecutor([{'type': 'accuracy', 'top_k': 1}], None)
         with pytest.raises(ConfigError):
-            dispatcher.update_metrics_on_batch(annotations, predictions)
+            dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
     def test_complete_accuracy(self):
         annotations = [ClassificationAnnotation('identifier', 3)]
         predictions = [ClassificationPrediction('identifier', [1.0, 1.0, 1.0, 4.0])]
 
         dispatcher = MetricsExecutor([{'type': 'accuracy', 'top_k': 1}], None)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result.name == 'accuracy'
@@ -160,7 +160,7 @@ def test_complete_accuracy_with_container_default_sources(self):
         predictions = [ContainerPrediction({'p': ClassificationPrediction('identifier', [1.0, 1.0, 1.0, 4.0])})]
 
         dispatcher = MetricsExecutor([{'type': 'accuracy', 'top_k': 1}], None)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result.name == 'accuracy'
@@ -174,7 +174,7 @@ def test_complete_accuracy_with_container_sources(self):
         config = [{'type': 'accuracy', 'top_k': 1, 'annotation_source': 'a', 'prediction_source': 'p'}]
 
         dispatcher = MetricsExecutor(config, None)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result.name == 'accuracy'
@@ -199,7 +199,7 @@ def test_complete_accuracy_top_3(self):
         predictions = [ClassificationPrediction('identifier', [1.0, 3.0, 4.0, 2.0])]
 
         dispatcher = MetricsExecutor([{'type': 'accuracy', 'top_k': 3}], None)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result.name == 'accuracy'
@@ -248,7 +248,7 @@ def test_classification_per_class_accuracy_fully_zero_prediction(self):
         prediction = ClassificationPrediction('identifier', [1.0, 2.0])
         dataset = DummyDataset(label_map={0: '0', 1: '1'})
         dispatcher = MetricsExecutor([{'type': 'accuracy_per_class', 'top_k': 1}], dataset)
-        dispatcher.update_metrics_on_batch([annotation], [prediction])
+        dispatcher.update_metrics_on_batch(range(1), [annotation], [prediction])
         for _, evaluation_result in dispatcher.iterate_metrics([annotation], [prediction]):
             assert evaluation_result.name == 'accuracy_per_class'
             assert len(evaluation_result.evaluated_value) == 2
@@ -263,7 +263,7 @@ def test_classification_per_class_accuracy_partially_zero_prediction(self):
         dataset = DummyDataset(label_map={0: '0', 1: '1'})
         dispatcher = MetricsExecutor([{'type': 'accuracy_per_class', 'top_k': 1}], dataset)
 
-        dispatcher.update_metrics_on_batch(annotation, prediction)
+        dispatcher.update_metrics_on_batch(range(len(annotation)), annotation, prediction)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotation, prediction):
             assert evaluation_result.name == 'accuracy_per_class'
@@ -282,7 +282,7 @@ def test_classification_per_class_accuracy_complete_prediction(self):
         dataset = DummyDataset(label_map={0: '0', 1: '1'})
         dispatcher = MetricsExecutor([{'type': 'accuracy_per_class', 'top_k': 1}], dataset)
 
-        dispatcher.update_metrics_on_batch(annotation, prediction)
+        dispatcher.update_metrics_on_batch(range(len(annotation)), annotation, prediction)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotation, prediction):
             assert evaluation_result.name == 'accuracy_per_class'
@@ -306,7 +306,7 @@ def test_classification_per_class_accuracy_partially_prediction(self):
         dataset = DummyDataset(label_map={0: '0', 1: '1'})
         dispatcher = MetricsExecutor([{'type': 'accuracy_per_class', 'top_k': 1}], dataset)
 
-        dispatcher.update_metrics_on_batch(annotation, prediction)
+        dispatcher.update_metrics_on_batch(range(len(annotation)), annotation, prediction)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotation, prediction):
             assert evaluation_result.name == 'accuracy_per_class'
@@ -325,7 +325,7 @@ def test_classification_per_class_accuracy_prediction_top3_zero(self):
         dataset = DummyDataset(label_map={0: '0', 1: '1', 2: '2', 3: '3'})
         dispatcher = MetricsExecutor([{'type': 'accuracy_per_class', 'top_k': 3}], dataset)
 
-        dispatcher.update_metrics_on_batch(annotation, prediction)
+        dispatcher.update_metrics_on_batch(range(len(annotation)), annotation, prediction)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotation, prediction):
             assert evaluation_result.name == 'accuracy_per_class'
@@ -346,7 +346,7 @@ def test_classification_per_class_accuracy_prediction_top3(self):
         dataset = DummyDataset(label_map={0: '0', 1: '1', 2: '2', 3: '3'})
         dispatcher = MetricsExecutor([{'type': 'accuracy_per_class', 'top_k': 3}], dataset)
 
-        dispatcher.update_metrics_on_batch(annotation, prediction)
+        dispatcher.update_metrics_on_batch(range(len(annotation)), annotation, prediction)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotation, prediction):
             assert evaluation_result.name == 'accuracy_per_class'
@@ -359,6 +359,82 @@ def test_classification_per_class_accuracy_prediction_top3(self):
             assert evaluation_result.threshold is None
 
 
+class TestMetricPerInstanceResult:
+    def test_classification_accuracy_result_for_batch_1(self):
+        """A single correct top-1 sample yields one accuracy entry of 1.0 under id 0."""
+        gt = [ClassificationAnnotation('identifier', 3)]
+        preds = [ClassificationPrediction('identifier', [1.0, 1.0, 1.0, 4.0])]
+        executor = MetricsExecutor([{'type': 'accuracy', 'top_k': 1}], None)
+
+        per_image = executor.update_metrics_on_batch(range(len(gt)), gt, preds)
+        assert len(per_image) == 1
+        assert 0 in per_image
+        assert len(per_image[0]) == 1
+        assert per_image[0][0] == PerImageMetricResult('accuracy', 'accuracy', 1.0, 'higher-better')
+
+    def test_classification_accuracy_result_for_batch_1_with_named_metric(self):
+        """The configured metric name ('accuracy@top1') is carried into the per-image result."""
+        gt = [ClassificationAnnotation('identifier', 3)]
+        preds = [ClassificationPrediction('identifier', [1.0, 1.0, 1.0, 4.0])]
+        executor = MetricsExecutor([{'type': 'accuracy', 'top_k': 1, 'name': 'accuracy@top1'}], None)
+
+        per_image = executor.update_metrics_on_batch(range(len(gt)), gt, preds)
+        assert len(per_image) == 1
+        assert 0 in per_image
+        assert len(per_image[0]) == 1
+        assert per_image[0][0] == PerImageMetricResult('accuracy@top1', 'accuracy', 1.0, 'higher-better')
+
+    def test_classification_accuracy_result_for_batch_1_with_2_metrics(self):
+        """Two configured metrics produce two entries, in config order, for the single sample."""
+        gt = [ClassificationAnnotation('identifier', 3)]
+        preds = [ClassificationPrediction('identifier', [1.0, 1.0, 1.0, 4.0])]
+        top1 = {'name': 'top1', 'type': 'accuracy', 'top_k': 1}
+        top3 = {'name': 'top3', 'type': 'accuracy', 'top_k': 3}
+        executor = MetricsExecutor([top1, top3], None)
+        per_image = executor.update_metrics_on_batch(range(len(gt)), gt, preds)
+        expected = (
+            PerImageMetricResult('top1', 'accuracy', 1.0, 'higher-better'),
+            PerImageMetricResult('top3', 'accuracy', 1.0, 'higher-better'),
+        )
+        assert len(per_image) == 1
+        assert 0 in per_image
+        assert len(per_image[0]) == 2
+        assert per_image[0][0] == expected[0]
+        assert per_image[0][1] == expected[1]
+
+    def test_classification_accuracy_result_for_batch_2(self):
+        """A two-sample batch yields one accuracy entry per id (0 -> 1.0, 1 -> 0.0)."""
+        gt = [ClassificationAnnotation('identifier', 3), ClassificationAnnotation('identifier1', 1)]
+        scores = [1.0, 1.0, 1.0, 4.0]
+        preds = [
+            ClassificationPrediction('identifier', list(scores)),
+            ClassificationPrediction('identifier2', list(scores)),
+        ]
+        executor = MetricsExecutor([{'type': 'accuracy', 'top_k': 1}], None)
+        per_image = executor.update_metrics_on_batch(range(len(gt)), gt, preds)
+        assert len(per_image) == 2
+        for sample_id, value in ((0, 1.0), (1, 0.0)):
+            assert sample_id in per_image
+            assert len(per_image[sample_id]) == 1
+            assert per_image[sample_id][0] == PerImageMetricResult('accuracy', 'accuracy', value, 'higher-better')
+
+    def test_classification_accuracy_result_for_batch_2_with_not_ordered_ids(self):
+        """Results are keyed by the ids passed in ([42, 17]), not by position in the batch."""
+        gt = [ClassificationAnnotation('identifier', 3), ClassificationAnnotation('identifier1', 1)]
+        scores = [1.0, 1.0, 1.0, 4.0]
+        preds = [
+            ClassificationPrediction('identifier', list(scores)),
+            ClassificationPrediction('identifier2', list(scores)),
+        ]
+        executor = MetricsExecutor([{'type': 'accuracy', 'top_k': 1}], None)
+        per_image = executor.update_metrics_on_batch([42, 17], gt, preds)
+        assert len(per_image) == 2
+        for sample_id, value in ((42, 1.0), (17, 0.0)):
+            assert sample_id in per_image
+            assert len(per_image[sample_id]) == 1
+            assert per_image[sample_id][0] == PerImageMetricResult('accuracy', 'accuracy', value, 'higher-better')
+
+
 class TestMetricExtraArgs:
     def test_all_metrics_raise_config_error_on_extra_args(self):
         for provider in Metric.providers:
diff --git a/tools/accuracy_checker/tests/test_model_evaluator.py b/tools/accuracy_checker/tests/test_model_evaluator.py
index d4b10a62691..7747363e4d9 100644
--- a/tools/accuracy_checker/tests/test_model_evaluator.py
+++ b/tools/accuracy_checker/tests/test_model_evaluator.py
@@ -45,7 +45,7 @@ def setup_method(self):
         self.annotations = [[annotation_container_0], [annotation_container_1]]
 
         self.dataset = MagicMock()
-        self.dataset.__iter__.return_value = self.annotations
+        self.dataset.__iter__.return_value = [(range(1), self.annotations[0]), (range(1), self.annotations[1])]
 
         self.postprocessor.process_batch = Mock(side_effect=[
             ([annotation_container_0], [annotation_container_0]), ([annotation_container_1], [annotation_container_1])
@@ -185,7 +185,7 @@ def setup_method(self):
         self.annotations = [[annotation_container_0], [annotation_container_1]]
 
         self.dataset = MagicMock()
-        self.dataset.__iter__.return_value = self.annotations
+        self.dataset.__iter__.return_value = [(range(1), self.annotations[0]), (range(1), self.annotations[1])]
 
         self.postprocessor.process_batch = Mock(side_effect=[
             ([annotation_container_0], [annotation_container_0]), ([annotation_container_1], [annotation_container_1])
@@ -218,6 +218,8 @@ def setup_method(self):
 
     def test_process_dataset_without_storing_predictions_and_dataset_processors(self):
         self.postprocessor.has_dataset_processors = False
+        self.launcher.allow_reshape_input = False
+        self.preprocessor.has_multi_infer_transformations = False
 
         self.evaluator.dataset_processor(None, None)
 
@@ -227,19 +229,10 @@ def test_process_dataset_without_storing_predictions_and_dataset_processors(self
         assert self.launcher.predict_async.called
         assert self.metric.update_metrics_on_batch.call_count == len(self.annotations)
 
-    def test_process_dataset_without_storing_predictions_and_with_dataset_processors(self):
-        self.postprocessor.has_dataset_processors = True
-
-        self.evaluator.dataset_processor(None, None)
-
-        assert not self.evaluator.store_predictions.called
-        assert not self.evaluator.load.called
-        assert not self.launcher.predict.called
-        assert self.launcher.predict_async.called
-        assert self.metric.update_metrics_on_batch.call_count == 1
-
     def test_process_dataset_with_storing_predictions_and_without_dataset_processors(self):
         self.postprocessor.has_dataset_processors = False
+        self.launcher.allow_reshape_input = False
+        self.preprocessor.has_multi_infer_transformations = False
 
         self.evaluator.dataset_processor('path', None)
 
@@ -250,20 +243,6 @@ def test_process_dataset_with_storing_predictions_and_without_dataset_processors
         assert self.postprocessor.process_batch.called
         assert self.metric.update_metrics_on_batch.call_count == len(self.annotations)
 
-    def test_process_dataset_with_storing_predictions_and_with_dataset_processors(self):
-        self.postprocessor.has_dataset_processors = True
-
-        self.evaluator.dataset_processor('path', None)
-
-        assert self.evaluator.store_predictions.called
-        assert not self.evaluator.load.called
-        assert not self.launcher.predict.called
-        assert self.launcher.predict_async.called
-        assert self.postprocessor.process_batch.called
-        assert self.metric.update_metrics_on_batch.call_count == 1
-        assert self.postprocessor.process_dataset.called
-        assert not self.postprocessor.full_process.called
-
     def test_process_dataset_with_loading_predictions_and_without_dataset_processors(self, mocker):
         mocker.patch('accuracy_checker.evaluators.model_evaluator.get_path')
         self.postprocessor.has_dataset_processors = False
@@ -277,3 +256,29 @@ def test_process_dataset_with_loading_predictions_and_without_dataset_processors
         assert self.metric.update_metrics_on_batch.call_count == 1
         assert not self.postprocessor.process_dataset.called
         assert self.postprocessor.full_process.called
+
+    def test_switch_to_sync_predict_if_need_reshaping(self):
+        """With launcher.allow_reshape_input set, evaluation must go through predict, not predict_async."""
+        self.launcher.allow_reshape_input = True
+        self.preprocessor.has_multi_infer_transformations = False
+        self.postprocessor.has_dataset_processors = False
+        self.evaluator.process_dataset(None, None)
+
+        assert self.launcher.predict.called
+        assert not self.launcher.predict_async.called
+        assert not self.evaluator.store_predictions.called
+        assert not self.evaluator.load.called
+        assert self.metric.update_metrics_on_batch.call_count == len(self.annotations)
+
+    def test_switch_to_sync_predict_if_need_multi_infer(self):
+        """With multi-infer preprocessing flagged, evaluation must use predict, not predict_async."""
+        self.preprocessor.has_multi_infer_transformations = True
+        self.launcher.allow_reshape_input = False
+        self.postprocessor.has_dataset_processors = False
+        self.evaluator.process_dataset(None, None)
+
+        assert self.launcher.predict.called
+        assert not self.launcher.predict_async.called
+        assert not self.evaluator.store_predictions.called
+        assert not self.evaluator.load.called
+        assert self.metric.update_metrics_on_batch.call_count == len(self.annotations)
diff --git a/tools/accuracy_checker/tests/test_onnx_launcher.py b/tools/accuracy_checker/tests/test_onnx_launcher.py
index 42f010c6d51..5b171ad9243 100644
--- a/tools/accuracy_checker/tests/test_onnx_launcher.py
+++ b/tools/accuracy_checker/tests/test_onnx_launcher.py
@@ -23,14 +23,25 @@
 from accuracy_checker.launcher.launcher import create_launcher
 from accuracy_checker.config import ConfigError
 
-
-def get_onnx_test_model(models_dir):
+def old_onnxrunitme(models_dir):
+    import onnxruntime as rt  # imported lazily, only when this probe runs
+    session = rt.InferenceSession(str(models_dir / "samplenet.onnx"))
+    try:
+        session.get_providers()
+    except AttributeError:
+        return True  # no get_providers() on the session: reported as "old" runtime
+    return False
+
+def get_onnx_test_model(models_dir, device=None, ep=None):
     config = {
         "framework": "onnx_runtime",
         "model": str(models_dir / "samplenet.onnx"),
         "adapter": "classification",
-        "device": "cpu",
     }
+    if device is not None:
+        config['device'] = device
+    if ep is not None:
+        config['execution_providers'] = ep
     return create_launcher(config)
 
 
@@ -41,16 +52,27 @@ def test_launcher_creates(self, models_dir):
         assert launcher.output_blob == 'fc3'
 
     def test_infer(self, data_dir, models_dir):
-        mx_test_model = get_onnx_test_model(models_dir)
-        _, _, h, w = mx_test_model.inputs['data']
+        onnx_test_model = get_onnx_test_model(models_dir)
+        _, _, h, w = onnx_test_model.inputs['data']
         img_raw = cv2.imread(str(data_dir / '1.jpg'))
         img_rgb = cv2.cvtColor(img_raw, cv2.COLOR_BGR2RGB)
         img_resized = cv2.resize(img_rgb, (w, h))
         input_blob = np.transpose([img_resized], (0, 3, 1, 2))
-        res = mx_test_model.predict([{'data': input_blob.astype(np.float32)}], [{}])
+        res = onnx_test_model.predict([{'data': input_blob.astype(np.float32)}], [{}])
 
         assert np.argmax(res[0]['fc3']) == 7
 
+    def test_infer_with_execution_provider(self, data_dir, models_dir):
+        """Inference with an explicit CPUExecutionProvider must predict the same class as test_infer."""
+        if old_onnxrunitme(models_dir):
+            pytest.skip("onnxruntime does not support EP")  # positional: `reason=` needs pytest >= 7.0
+        onnx_test_model = get_onnx_test_model(models_dir, ep=['CPUExecutionProvider'])
+        _, _, h, w = onnx_test_model.inputs['data']
+        img_rgb = cv2.cvtColor(cv2.imread(str(data_dir / '1.jpg')), cv2.COLOR_BGR2RGB)
+        input_blob = np.transpose([cv2.resize(img_rgb, (w, h))], (0, 3, 1, 2))
+        res = onnx_test_model.predict([{'data': input_blob.astype(np.float32)}], [{}])
+        assert np.argmax(res[0]['fc3']) == 7  # same model and image as test_infer
+
 
 @pytest.mark.usefixtures('mock_path_exists')
 class TestONNXRuntimeLauncherConfig:
diff --git a/tools/accuracy_checker/tests/test_preprocessor.py b/tools/accuracy_checker/tests/test_preprocessor.py
index 19d88326078..6b921908928 100644
--- a/tools/accuracy_checker/tests/test_preprocessor.py
+++ b/tools/accuracy_checker/tests/test_preprocessor.py
@@ -32,7 +32,7 @@
     GeometricOperationMetadata
 )
 from accuracy_checker.preprocessor.preprocessing_executor import PreprocessingExecutor
-from accuracy_checker.preprocessor.geometric_transformations import _OpenCVResizer
+from accuracy_checker.preprocessor.resize import _OpenCVResizer
 from accuracy_checker.data_readers import DataRepresentation
 
 
@@ -47,7 +47,7 @@ def test_default_resize(self, mocker):
         assert resize.dst_width == 200
         assert resize.dst_height == 200
         cv2_resize_mock.assert_called_once_with(
-            input_mock, (200, 200), interpolation=_OpenCVResizer.supported_interpolations['LINEAR']
+            input_mock, (200, 200), interpolation=_OpenCVResizer.supported_interpolations()['LINEAR']
         )
 
     def test_custom_resize(self, mocker):
@@ -65,7 +65,7 @@ def test_custom_resize(self, mocker):
         assert resize.dst_height == 128
         cv2_resize_mock.assert_called_once_with(
             input_mock, (126, 128),
-            interpolation=_OpenCVResizer.supported_interpolations['CUBIC']
+            interpolation=_OpenCVResizer.supported_interpolations()['CUBIC']
         )
 
     def test_resize_without_save_aspect_ratio(self):
@@ -186,7 +186,8 @@ def test_resize_provided_only_dst_width_raise_config_error(self):
 class TestAutoResize:
     def test_default_auto_resize(self, mocker):
         cv2_resize_mock = mocker.patch('accuracy_checker.preprocessor.geometric_transformations.cv2.resize')
-        resize = Preprocessor.provide('auto_resize', {'type': 'auto_resize'}, input_shapes={'data': [1, 3, 200, 200]})
+        resize = Preprocessor.provide('auto_resize', {'type': 'auto_resize'})
+        resize.set_input_shape({'data': (1, 3, 200, 200)})
 
         input_mock = mocker.Mock()
         resize(DataRepresentation(input_mock))
@@ -195,20 +196,19 @@ def test_default_auto_resize(self, mocker):
         assert resize.dst_height == 200
         cv2_resize_mock.assert_called_once_with(input_mock, (200, 200))
 
-    def test_auto_resize_input_shape_not_provided_raise_config_error(self):
+    def test_auto_resize_input_shape_not_provided_raise_config_error(self, mocker):
+        input_mock = mocker.Mock()
         with pytest.raises(ConfigError):
-            Preprocessor.provide('auto_resize', {'type': 'auto_resize'})
+            Preprocessor.provide('auto_resize', {'type': 'auto_resize'})(DataRepresentation(input_mock))
 
     def test_auto_resize_with_several_input_shapes_raise_config_error(self):
         with pytest.raises(ConfigError):
-            Preprocessor.provide(
-                'auto_resize', {'type': 'auto_resize'},
-                input_shapes={'data': [1, 3, 200, 200], 'data2': [1, 3, 300, 300]}
-            )
+            auto_resize = Preprocessor.provide('auto_resize', {'type': 'auto_resize'})
+            auto_resize.set_input_shape({'data': [1, 3, 200, 200], 'data2': [1, 3, 300, 300]})
 
     def test_auto_resize_empty_input_shapes_raise_config_error(self):
         with pytest.raises(ConfigError):
-            Preprocessor.provide('auto_resize', {'type': 'auto_resize'}, input_shapes={})
+            Preprocessor.provide('auto_resize', {'type': 'auto_resize'}).set_input_shape({})
 
 
 class TestNormalization:
@@ -697,9 +697,7 @@ def test_resize_raise_config_error_on_extra_args(self):
 
     def test_auto_resize_raise_config_error_on_extra_args(self):
         with pytest.raises(ConfigError):
-            Preprocessor.provide('auto_resize', {'type': 'auto_resize', 'something_extra': 'extra'},
-                                 input_shapes={'data': [1, 3, 200, 200]}
-                                 )
+            Preprocessor.provide('auto_resize', {'type': 'auto_resize', 'something_extra': 'extra'},)
 
     def test_normalization_raise_config_error_on_extra_args(self):
         with pytest.raises(ConfigError):
diff --git a/tools/accuracy_checker/tests/test_presenter.py b/tools/accuracy_checker/tests/test_presenter.py
index 4d2b5d4f501..76deb176b1f 100644
--- a/tools/accuracy_checker/tests/test_presenter.py
+++ b/tools/accuracy_checker/tests/test_presenter.py
@@ -28,7 +28,7 @@ def test_config_default_presenter(self):
         predictions = [ClassificationPrediction('identifier', [1.0, 1.0, 1.0, 4.0])]
         config = [{'type': 'accuracy', 'top_k': 1}]
         dispatcher = MetricsExecutor(config, None)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for presenter, _ in dispatcher.iterate_metrics(annotations, predictions):
             assert isinstance(presenter, ScalarPrintPresenter)
@@ -38,7 +38,7 @@ def test_config_scalar_presenter(self):
         predictions = [ClassificationPrediction('identifier', [1.0, 1.0, 1.0, 4.0])]
         config = [{'type': 'accuracy', 'top_k': 1, 'presenter': 'print_scalar'}]
         dispatcher = MetricsExecutor(config, None)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for presenter, _ in dispatcher.iterate_metrics(annotations, predictions):
             assert isinstance(presenter, ScalarPrintPresenter)
@@ -48,7 +48,7 @@ def test_config_vector_presenter(self):
         predictions = [ClassificationPrediction('identifier', [1.0, 1.0, 1.0, 4.0])]
         config = [{'type': 'accuracy', 'top_k': 1, 'presenter': 'print_vector'}]
         dispatcher = MetricsExecutor(config, None)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for presenter, _ in dispatcher.iterate_metrics(annotations, predictions):
             assert isinstance(presenter, VectorPrintPresenter)
diff --git a/tools/accuracy_checker/tests/test_pytorch_launcher.py b/tools/accuracy_checker/tests/test_pytorch_launcher.py
new file mode 100644
index 00000000000..788bf7497fd
--- /dev/null
+++ b/tools/accuracy_checker/tests/test_pytorch_launcher.py
@@ -0,0 +1,62 @@
+"""
+Copyright (c) 2019 Intel Corporation
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
+import pytest
+pytest.importorskip('torch')
+import cv2
+import numpy as np
+
+from accuracy_checker.launcher.launcher import create_launcher
+from accuracy_checker.config import ConfigError
+
+def get_pth_test_model(models_dir):
+    """Create a CPU 'pytorch' launcher for SampLeNet stored under models_dir/pytorch_model."""
+    model_root = models_dir / 'pytorch_model'
+    return create_launcher({
+        'framework': 'pytorch',
+        'module': 'samplenet.SampLeNet',
+        'checkpoint': model_root / 'samplenet.pth',
+        'python_path': model_root,
+        'adapter': 'classification',
+        'device': 'cpu',
+    })
+
+
+class TestPytorchLauncher:
+    """Checks on the 'pytorch' launcher built by get_pth_test_model."""
+    def test_launcher_creates(self, models_dir):
+        created = get_pth_test_model(models_dir)
+        assert created.inputs['input'] == (1, -1, -1, -1)
+        assert created.output_blob == 'output'
+
+    def test_infer(self, data_dir, models_dir):
+        """Feed one 32x32 RGB image and expect index 5 as arg-max of 'output'."""
+        model = get_pth_test_model(models_dir)
+        bgr_small = cv2.resize(cv2.imread(str(data_dir / '1.jpg')), (32, 32))
+        rgb_small = cv2.cvtColor(bgr_small, cv2.COLOR_BGR2RGB)
+        blob = model.fit_to_input([rgb_small], 'input', (0, 3, 1, 2))
+
+        outputs = model.predict([{'input': blob}], [{}])
+        assert np.argmax(outputs[0]['output']) == 5
+
+
+@pytest.mark.usefixtures('mock_path_exists')
+class TestMxNetLauncherConfig:
+    # NOTE(review): exercises the 'pytorch' framework; the MxNet class name looks copy-pasted - confirm.
+    def test_missed_model_in_create_pytoch_launcher_raises_config_error_exception(self):
+        """A config holding only the 'framework' key must be rejected with ConfigError."""
+        with pytest.raises(ConfigError):
+            create_launcher({'framework': 'pytorch'})
diff --git a/tools/accuracy_checker/tests/test_regression_metrics.py b/tools/accuracy_checker/tests/test_regression_metrics.py
index 5e478043497..c085e9b521a 100644
--- a/tools/accuracy_checker/tests/test_regression_metrics.py
+++ b/tools/accuracy_checker/tests/test_regression_metrics.py
@@ -15,8 +15,11 @@
 """
 
 import pytest
+import numpy as np
 from accuracy_checker.metrics import MetricsExecutor
-from accuracy_checker.representation import RegressionPrediction, RegressionAnnotation
+from accuracy_checker.representation import (
+    RegressionPrediction, RegressionAnnotation, FacialLandmarksAnnotation, FacialLandmarksPrediction
+)
 from accuracy_checker.presenters import EvaluationResult
 
 
@@ -34,11 +37,11 @@ def test_mae_with_zero_diff_between_annotation_and_prediction(self):
             'mae',
             'mae',
             None,
-            {'postfix': ' ', 'scale': 1, 'names': ['mean', 'std'], 'calculate_mean': False}
+            {'postfix': ' ', 'scale': 1, 'names': ['mean', 'std'], 'calculate_mean': False, 'target': 'higher-worse'}
         )
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -53,11 +56,11 @@ def test_mae_with_negative_diff_between_annotation_and_prediction(self):
             'mae',
             'mae',
             None,
-            {'postfix': ' ', 'scale': 1, 'names': ['mean', 'std'], 'calculate_mean': False}
+            {'postfix': ' ', 'scale': 1, 'names': ['mean', 'std'], 'calculate_mean': False, 'target': 'higher-worse'}
         )
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -72,11 +75,11 @@ def test_mae_with_positive_diff_between_annotation_and_prediction(self):
             'mae',
             'mae',
             None,
-            {'postfix': ' ', 'scale': 1, 'names': ['mean', 'std'], 'calculate_mean': False}
+            {'postfix': ' ', 'scale': 1, 'names': ['mean', 'std'], 'calculate_mean': False, 'target': 'higher-worse'}
         )
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -91,11 +94,11 @@ def test_mse_with_zero_diff_between_annotation_and_prediction(self):
             'mse',
             'mse',
             None,
-            {'postfix': ' ', 'scale': 1, 'names': ['mean', 'std'], 'calculate_mean': False}
+            {'postfix': ' ', 'scale': 1, 'names': ['mean', 'std'], 'calculate_mean': False, 'target': 'higher-worse'}
         )
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -110,11 +113,11 @@ def test_mse_with_negative_diff_between_annotation_and_prediction(self):
             'mse',
             'mse',
             None,
-            {'postfix': ' ', 'scale': 1, 'names': ['mean', 'std'], 'calculate_mean': False}
+            {'postfix': ' ', 'scale': 1, 'names': ['mean', 'std'], 'calculate_mean': False, 'target': 'higher-worse'}
         )
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -129,11 +132,11 @@ def test_mse_with_positive_diff_between_annotation_and_prediction(self):
             'mse',
             'mse',
             None,
-            {'postfix': ' ', 'scale': 1, 'names': ['mean', 'std'], 'calculate_mean': False}
+            {'postfix': ' ', 'scale': 1, 'names': ['mean', 'std'], 'calculate_mean': False, 'target': 'higher-worse'}
         )
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -153,11 +156,11 @@ def test_mae_on_interval_default_all_missed(self):
             'mae_on_interval',
             'mae_on_interval',
             None,
-            {'postfix': ' ', 'scale': 1, 'names': [], 'calculate_mean': False}
+            {'postfix': ' ', 'scale': 1, 'names': [], 'calculate_mean': False, 'target': 'higher-worse'}
         )
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         with pytest.warns(UserWarning) as warnings:
             for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
@@ -177,13 +180,14 @@ def test_mae_on_interval_default_all_not_in_range_not_ignore_out_of_range(self):
                 'postfix': ' ',
                 'scale': 1,
                 'names': ['mean: < 0.0', 'std: < 0.0', 'mean: > 1.0', 'std: > 1.0'],
-                'calculate_mean': False
+                'calculate_mean': False,
+                'target': 'higher-worse'
             }
         )
         config = [{'type': 'mae_on_interval', 'end': 1, 'ignore_values_not_in_interval': False}]
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -198,11 +202,11 @@ def test_mae_on_interval_values_in_range(self):
             'mae_on_interval',
             'mae_on_interval',
             None,
-            {'postfix': ' ', 'scale': 1, 'names': ['mean: <= 0.0 < 1.0', 'std: <= 0.0 < 1.0'], 'calculate_mean': False}
+            {'postfix': ' ', 'scale': 1, 'names': ['mean: <= 0.0 < 1.0', 'std: <= 0.0 < 1.0'], 'calculate_mean': False, 'target': 'higher-worse'}
         )
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -236,12 +240,13 @@ def test_mae_on_interval_default_not_ignore_out_of_range(self):
                     'mean: > 1.0',
                     'std: > 1.0'
                 ],
-                'calculate_mean': False
+                'calculate_mean': False,
+                'target': 'higher-worse'
             }
         )
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -268,12 +273,13 @@ def test_mae_on_interval_with_given_interval(self):
                 'postfix': ' ',
                 'scale': 1,
                 'names': ['mean: <= 0.0 < 2.0', 'std: <= 0.0 < 2.0', 'mean: <= 2.0 < 4.0', 'std: <= 2.0 < 4.0'],
-                'calculate_mean': False
+                'calculate_mean': False,
+                'target': 'higher-worse'
             }
         )
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -300,12 +306,13 @@ def test_mae_on_interval_with_repeated_values(self):
                 'postfix': ' ',
                 'scale': 1,
                 'names': ['mean: <= 0.0 < 2.0', 'std: <= 0.0 < 2.0', 'mean: <= 2.0 < 4.0', 'std: <= 2.0 < 4.0'],
-                'calculate_mean': False
+                'calculate_mean': False,
+                'target': 'higher-worse'
             }
         )
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -331,12 +338,95 @@ def test_mae_on_interval_with_unsorted_values(self):
             {
                 'postfix': ' ', 'scale': 1,
                 'names': ['mean: <= 0.0 < 2.0', 'std: <= 0.0 < 2.0', 'mean: <= 2.0 < 4.0', 'std: <= 2.0 < 4.0'],
-                'calculate_mean': False
+                'calculate_mean': False,
+                'target': 'higher-worse'
             }
         )
         dispatcher = MetricsExecutor(config, None)
 
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
 
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
+
+
+class TestUpdateRegressionMetrics:
+    def test_update_mae_metric_result(self):
+        annotations = [RegressionAnnotation('identifier', 3), RegressionAnnotation('identifier2', 1)]
+        predictions = [RegressionPrediction('identifier', 5), RegressionPrediction('identifier2', 5)]
+        config = [{'type': 'mae'}]
+        dispatcher = MetricsExecutor(config, None)
+
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        assert metric_result[0][0].result == 2
+        assert metric_result[1][0].result == 4
+
+    def test_update_mse_metric_result(self):
+        annotations = [RegressionAnnotation('identifier', 3), RegressionAnnotation('identifier2', 1)]
+        predictions = [RegressionPrediction('identifier', 5), RegressionPrediction('identifier2', 5)]
+        config = [{'type': 'mse'}]
+        dispatcher = MetricsExecutor(config, None)
+
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        assert metric_result[0][0].result == 4
+        assert metric_result[1][0].result == 16
+
+    def test_update_rmse_metric_result(self):
+        annotations = [RegressionAnnotation('identifier', 3), RegressionAnnotation('identifier2', 1)]
+        predictions = [RegressionPrediction('identifier', 5), RegressionPrediction('identifier2', 5)]
+        config = [{'type': 'rmse'}]
+        dispatcher = MetricsExecutor(config, None)
+
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        assert metric_result[0][0].result == 2
+        assert metric_result[1][0].result == 4
+
+    def test_update_mae_on_interval_metric(self):
+        config = [{'type': 'mae_on_interval', 'intervals': [0.0, 2.0, 4.0]}]
+        annotations = [RegressionAnnotation('identifier', 3), RegressionAnnotation('identifier2', 1)]
+        predictions = [RegressionPrediction('identifier', 5), RegressionPrediction('identifier2', 5)]
+        dispatcher = MetricsExecutor(config, None)
+
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        assert metric_result[0][0].result == 2
+        assert metric_result[1][0].result == 4
+
+    def test_update_mse_on_interval_metric(self):
+        config = [{'type': 'mse_on_interval', 'intervals': [0.0, 2.0, 4.0]}]
+        annotations = [RegressionAnnotation('identifier', 3), RegressionAnnotation('identifier2', 1)]
+        predictions = [RegressionPrediction('identifier', 5), RegressionPrediction('identifier2', 5)]
+        dispatcher = MetricsExecutor(config, None)
+
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        assert metric_result[0][0].result == 4
+        assert metric_result[1][0].result == 16
+
+    def test_update_rmse_on_interval_metric(self):
+        config = [{'type': 'rmse_on_interval', 'intervals': [0.0, 2.0, 4.0]}]
+        annotations = [RegressionAnnotation('identifier', 3), RegressionAnnotation('identifier2', 1)]
+        predictions = [RegressionPrediction('identifier', 5), RegressionPrediction('identifier2', 5)]
+        dispatcher = MetricsExecutor(config, None)
+
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        assert metric_result[0][0].result == 2
+        assert metric_result[1][0].result == 4
+
+    def test_update_per_point_normed_error(self):
+        config = [{'type': 'per_point_normed_error'}]
+        annotations = [FacialLandmarksAnnotation('identifier', np.array([1, 1, 1, 1, 1]), np.array([1, 1, 1, 1, 1]))]
+        annotations[0].metadata.update({'left_eye': 0, 'right_eye': 1})
+        predictions = [FacialLandmarksPrediction('identifier', np.array([1, 1, 1, 1, 1]), np.array([1, 1, 1, 1, 1]))]
+        dispatcher = MetricsExecutor(config, None)
+
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        assert np.equal(metric_result[0][0].result.all(), np.zeros(5).all())
+
+    def test_update_normed_error(self):
+        config = [{'type': 'normed_error'}]
+        annotations = [FacialLandmarksAnnotation('identifier', np.array([1, 1, 1, 1, 1]), np.array([1, 1, 1, 1, 1]))]
+        annotations[0].metadata.update({'left_eye': 0, 'right_eye': 1})
+        predictions = [FacialLandmarksPrediction('identifier', np.array([1, 1, 1, 1, 1]), np.array([1, 1, 1, 1, 1]))]
+        dispatcher = MetricsExecutor(config, None)
+
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        assert metric_result[0][0].result == 0
diff --git a/tools/accuracy_checker/tests/test_segmentation_metrics.py b/tools/accuracy_checker/tests/test_segmentation_metrics.py
index 56e13b660af..394ffcac0c8 100644
--- a/tools/accuracy_checker/tests/test_segmentation_metrics.py
+++ b/tools/accuracy_checker/tests/test_segmentation_metrics.py
@@ -26,7 +26,9 @@ def create_config(metric_name, use_argmax=False):
 
 
 def generate_expected_result(values, metric_name, labels=None):
-    meta = {'names': list(labels.values())} if labels else {}
+    meta = {'target': 'higher-better'}
+    if labels:
+        meta.update({'names': list(labels.values())})
 
     return EvaluationResult(pytest.approx(values), None, metric_name, metric_name, None, meta)
 
@@ -38,16 +40,23 @@ def test_one_class(self):
         annotations = make_segmentation_representation(np.array([[0, 0], [0, 0]]), True)
         predictions = make_segmentation_representation(np.array([[0, 0], [0, 0]]), False)
         dispatcher = MetricsExecutor(create_config(self.name), single_class_dataset())
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
         expected = generate_expected_result(1.0, self.name)
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
 
+    def test_one_class_update_metric_result(self):
+        annotations = make_segmentation_representation(np.array([[0, 0], [0, 0]]), True)
+        predictions = make_segmentation_representation(np.array([[0, 0], [0, 0]]), False)
+        dispatcher = MetricsExecutor(create_config(self.name), single_class_dataset())
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        assert metric_result[0][0].result == 1
+
     def test_multi_class_not_matched(self):
         annotations = make_segmentation_representation(np.array([[0, 0, 0, 0, 0], [0, 0, 0, 0, 0]]), True)
         predictions = make_segmentation_representation(np.array([[1, 1, 1, 1, 1], [1, 1, 1, 1, 1]]), False)
         dispatcher = MetricsExecutor(create_config(self.name), multi_class_dataset())
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
         expected = generate_expected_result(0.0, self.name)
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -56,11 +65,18 @@ def test_multi_class(self):
         annotations = make_segmentation_representation(np.array([[1, 0, 3, 0, 0], [0, 0, 0, 0, 0]]), True)
         predictions = make_segmentation_representation(np.array([[1, 2, 3, 2, 3], [0, 0, 0, 0, 0]]), False)
         dispatcher = MetricsExecutor(create_config(self.name), multi_class_dataset())
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
         expected = generate_expected_result((5.0+1.0+1.0)/(8.0+1.0+1.0), self.name)
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
 
+    def test_multi_class_update_metric_result(self):
+        annotations = make_segmentation_representation(np.array([[1, 0, 3, 0, 0], [0, 0, 0, 0, 0]]), True)
+        predictions = make_segmentation_representation(np.array([[1, 2, 3, 2, 3], [0, 0, 0, 0, 0]]), False)
+        dispatcher = MetricsExecutor(create_config(self.name), multi_class_dataset())
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        assert metric_result[0][0].result == 0.7
+
 
 class TestMeanAccuracy:
     name = 'mean_accuracy'
@@ -70,8 +86,8 @@ def test_one_class(self):
         predictions = make_segmentation_representation(np.array([[0, 0], [0, 0]]), False)
         dataset = single_class_dataset()
         dispatcher = MetricsExecutor(create_config(self.name), dataset)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
-        expected = generate_expected_result([1.0, 0.0], self.name, dataset.labels)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        expected = generate_expected_result([1.0], self.name, {0: dataset.labels[0]})
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
 
@@ -80,8 +96,8 @@ def test_multi_class_not_matched(self):
         predictions = make_segmentation_representation(np.array([[0, 0, 0, 0, 0], [0, 0, 0, 0, 0]]), False)
         dataset = multi_class_dataset()
         dispatcher = MetricsExecutor(create_config(self.name), dataset)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
-        expected = generate_expected_result([0.0, 0.0, 0.0, 0.0], self.name, dataset.labels)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        expected = generate_expected_result([0.0], self.name, {1: dataset.labels[1]})
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
 
@@ -90,11 +106,20 @@ def test_multi_class(self):
         annotations = make_segmentation_representation(np.array([[1, 2, 3, 2, 3], [0, 0, 0, 0, 0]]), True)
         predictions = make_segmentation_representation(np.array([[1, 0, 3, 0, 0], [0, 0, 0, 0, 0]]), False)
         dispatcher = MetricsExecutor(create_config(self.name), dataset)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
-        expected = generate_expected_result([1.0, 1.0, 0.0, 0.5], self.name, dataset.labels)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        expected = generate_expected_result([1.0, 1.0, 0.0, 0.5], self.name, dataset.label_map)
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
 
+    def test_update_metric_result(self):
+        dataset = multi_class_dataset()
+        annotations = make_segmentation_representation(np.array([[1, 2, 3, 2, 3], [0, 0, 0, 0, 0]]), True)
+        predictions = make_segmentation_representation(np.array([[1, 0, 3, 0, 0], [0, 0, 0, 0, 0]]), False)
+        dispatcher = MetricsExecutor(create_config(self.name), dataset)
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        for class_result, expected_class_result in zip(metric_result[0][0].result, [1.0, 1.0, 0.0, 0.5]):
+            assert class_result == expected_class_result
+
 
 class TestMeanIOU:
     name = 'mean_iou'
@@ -104,8 +129,8 @@ def test_one_class(self):
         predictions = make_segmentation_representation(np.array([[0, 0], [0, 0]]), False)
         dataset = single_class_dataset()
         dispatcher = MetricsExecutor(create_config(self.name), dataset)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
-        expected = generate_expected_result([1.0, 0.0], self.name, dataset.labels)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        expected = generate_expected_result([1.0], self.name, {0: dataset.labels[0]})
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
 
@@ -114,8 +139,8 @@ def test_multi_class_not_matched(self):
         predictions = make_segmentation_representation(np.array([[0, 0, 0, 0, 0], [0, 0, 0, 0, 0]]), False)
         dataset = multi_class_dataset()
         dispatcher = MetricsExecutor(create_config(self.name), dataset)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
-        expected = generate_expected_result([0.0, 0.0, 0.0, 0.0], self.name, dataset.labels)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        expected = generate_expected_result([0.0, 0.0], self.name, {0: dataset.labels[0], 1: dataset.labels[1]})
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
 
@@ -124,11 +149,20 @@ def test_multi_class(self):
         annotations = make_segmentation_representation(np.array([[1, 2, 3, 2, 3], [0, 0, 0, 0, 0]]), True)
         predictions = make_segmentation_representation(np.array([[1, 0, 3, 0, 0], [0, 0, 0, 0, 0]]), False)
         dispatcher = MetricsExecutor(create_config(self.name), dataset)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
         expected = generate_expected_result([0.625, 1.0, 0.0, 0.5], self.name, dataset.labels)
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
 
+    def test_update_metric_result(self):
+        dataset = multi_class_dataset()
+        annotations = make_segmentation_representation(np.array([[1, 2, 3, 2, 3], [0, 0, 0, 0, 0]]), True)
+        predictions = make_segmentation_representation(np.array([[1, 0, 3, 0, 0], [0, 0, 0, 0, 0]]), False)
+        dispatcher = MetricsExecutor(create_config(self.name), dataset)
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        for class_result, expected_class_result in zip(metric_result[0][0].result, [0.625, 1.0, 0.0, 0.5]):
+            assert class_result == expected_class_result
+
 
 class TestSegmentationFWAcc:
     name = 'frequency_weighted_accuracy'
@@ -138,7 +172,7 @@ def test_one_class(self):
         predictions = make_segmentation_representation(np.array([[0, 0], [0, 0]]), False)
         dataset = single_class_dataset()
         dispatcher = MetricsExecutor(create_config(self.name), dataset)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
         expected = generate_expected_result(1.0, self.name)
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -148,7 +182,7 @@ def test_multi_class_not_matched(self):
         predictions = make_segmentation_representation(np.array([[0, 0, 0, 0, 0], [0, 0, 0, 0, 0]]), False)
         dataset = multi_class_dataset()
         dispatcher = MetricsExecutor(create_config(self.name), dataset)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
         expected = generate_expected_result(0.0, self.name)
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
@@ -158,7 +192,15 @@ def test_multi_class(self):
         annotations = make_segmentation_representation(np.array([[1, 2, 3, 2, 3], [0, 0, 0, 0, 0]]), True)
         predictions = make_segmentation_representation(np.array([[1, 0, 3, 0, 0], [0, 0, 0, 0, 0]]), False)
         dispatcher = MetricsExecutor(create_config(self.name), dataset)
-        dispatcher.update_metrics_on_batch(annotations, predictions)
+        dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
         expected = generate_expected_result(0.5125, self.name)
         for _, evaluation_result in dispatcher.iterate_metrics(annotations, predictions):
             assert evaluation_result == expected
+
+    def test_update_metric_result(self):
+        dataset = multi_class_dataset()
+        annotations = make_segmentation_representation(np.array([[1, 2, 3, 2, 3], [0, 0, 0, 0, 0]]), True)
+        predictions = make_segmentation_representation(np.array([[1, 0, 3, 0, 0], [0, 0, 0, 0, 0]]), False)
+        dispatcher = MetricsExecutor(create_config(self.name), dataset)
+        metric_result = dispatcher.update_metrics_on_batch(range(len(annotations)), annotations, predictions)
+        assert metric_result[0][0].result == 0.5125
diff --git a/tools/downloader/README.md b/tools/downloader/README.md
index 5ddf7575456..f999758cc80 100644
--- a/tools/downloader/README.md
+++ b/tools/downloader/README.md
@@ -32,12 +32,31 @@ For the model converter, you will also need to install the OpenVINO&trade;
 toolkit and the prerequisite libraries for Model Optimizer. See the
 [OpenVINO toolkit documentation](https://docs.openvinotoolkit.org/) for details.
 
-If you using models from PyTorch framework, you will also need to use intermediate
-conversion to ONNX format. To use automatic conversion install additional dependencies:
+If you are using models from the PyTorch or Caffe2 framework, you will also need to use intermediate
+conversion to ONNX format. To use automatic conversion, install additional dependencies.
 
+For models from PyTorch:
 ```sh
 python3 -mpip install --user -r ./requirements-pytorch.in
 ```
+For models from Caffe2:
+```sh
+python3 -mpip install --user -r ./requirements-caffe2.in
+```
+
+When running the model downloader with Python 3.5.x on macOS, you may encounter
+an error similar to the following:
+
+> requests.exceptions.SSLError: [...] (Caused by SSLError(SSLError(1, '[SSL: TLSV1_ALERT_PROTOCOL_VERSION]
+tlsv1 alert protocol version (\_ssl.c:719)'),))
+
+You can work around this by installing additional packages:
+
+```sh
+python3 -mpip install --user 'requests[security]'
+```
+
+Alternatively, upgrade to Python 3.6 or a later version.
 
 Model downloader usage
 ----------------------
@@ -199,7 +218,7 @@ The basic usage is to run the script like this:
 ```
 
 This will convert all models into the Inference Engine IR format. Models that
-were originally in that format are ignored. Models in PyTorch's format will be
+were originally in that format are ignored. Models in PyTorch and Caffe2 formats will be
 converted in ONNX format first.
 
 The current directory must be the root of a download tree created by the model
@@ -298,15 +317,25 @@ describing a single model. Each such object has the following keys:
 * `description`: text describing the model. Paragraphs are separated by line feed characters.
 
 * `framework`: a string identifying the framework whose format the model is downloaded in.
-  Current possible values are `dldt` (Inference Engine IR), `caffe`, `mxnet`, `pytorch` and `tf` (TensorFlow).
-  Additional possible values might be added in the future.
+  Current possible values are `dldt` (Inference Engine IR), `caffe`, `caffe2`, `mxnet`, `onnx`,
+  `pytorch` and `tf` (TensorFlow). Additional possible values might be added in the future.
 
 * `license_url`: an URL for the license that the model is distributed under.
 
 * `precisions`: the list of precisions that the model has IR files for. For models downloaded
   in a format other than the Inference Engine IR format, these are the precisions that the model
-  converter can produce IR files in. Current possible values are `FP16`, `FP32`, `INT1`, `INT8`;
-  more might be added in the future.
+  converter can produce IR files in. Current possible values are:
+
+  * `FP16`
+  * `FP16-INT1`
+  * `FP16-INT8`
+  * `FP32`
+  * `FP32-INT1`
+  * `FP32-INT8`
+  * `INT1`
+  * `INT8`
+
+  Additional possible values might be added in the future.
 
 * `subdirectory`: the subdirectory of the output tree into which the downloaded or converted files
   will be placed by the downloader or the converter, respectively.
@@ -318,6 +347,7 @@ describing a single model. Each such object has the following keys:
   * `classification`
   * `detection`
   * `face_recognition`
+  * `feature_extraction`
   * `head_pose_estimation`
   * `human_pose_estimation`
   * `image_processing`
@@ -395,18 +425,6 @@ face-detection-retail-0005
 
 Either `--print_all` or one of the filter options must be specified.
 
-Deprecated options
-------------------
-
-In earlier releases, the tools used a single configuration file instead of
-per-model configuration files. For compatibility, loading such a file is still
-supported. However, this feature is deprecated and will be removed in a future release.
-
-To load a configuration file in the old format, use the `-c`/`--config` option:
-
-```sh
-./TOOL.py --all --config my-config.yml
-```
 __________
 
 OpenVINO is a trademark of Intel Corporation or its subsidiaries in the U.S.
diff --git a/tools/downloader/caffe2_to_onnx.py b/tools/downloader/caffe2_to_onnx.py
new file mode 100644
index 00000000000..0438552a734
--- /dev/null
+++ b/tools/downloader/caffe2_to_onnx.py
@@ -0,0 +1,80 @@
+import argparse
+from pathlib import Path
+import sys
+
+import onnx
+from caffe2.python.onnx.frontend import Caffe2Frontend
+from caffe2.proto import caffe2_pb2
+
+
+def positive_int_arg(values):
+    """Check positive integer type for input argument"""
+    result = []
+    for value in values.split(','):
+        try:
+            ivalue = int(value)
+            if ivalue < 0:
+                raise argparse.ArgumentTypeError('Argument must be a positive integer')
+            result.append(ivalue)
+        except Exception as exc:
+            print(exc)
+            sys.exit('Invalid value for input argument: {!r}, a positive integer is expected'.format(value))
+    return result
+
+def parse_args():
+    """Parse input arguments"""
+
+    parser = argparse.ArgumentParser(description='Conversion of pretrained models from Caffe2 to ONNX')
+
+    parser.add_argument('--model-name', type=str, required=True,
+                        help='Model name to convert.')
+    parser.add_argument('--output-file', type=Path, required=True,
+                        help='Path to the output ONNX model')
+    parser.add_argument('--model-path', type=Path, required=True,
+                        help='Path to predict_net .pb file')
+    parser.add_argument('--weights', type=Path, required=True,
+                        help='Path to init_net .pb file')
+    parser.add_argument('--input-shape', metavar='INPUT_DIM', type=positive_int_arg,
+                        required=True, help='Shape of the input blob')
+    parser.add_argument('--input-names', type=str, required=True,
+                        help='Comma separated names of the input layers')
+
+    return parser.parse_args()
+
+def convert_to_onnx(predict_net_path, init_net_path, input_shape, input_names, output_file, model_name=''):
+    """Convert Caffe2 model to ONNX and check the resulting onnx model"""
+
+    output_file.parent.mkdir(parents=True, exist_ok=True)
+
+    data_type = onnx.TensorProto.FLOAT
+    value_info = {input_names: [data_type, input_shape]}
+
+    predict_net = caffe2_pb2.NetDef()
+    predict_net.ParseFromString(predict_net_path.read_bytes())
+
+    predict_net.name = model_name
+
+    init_net = caffe2_pb2.NetDef()
+    init_net.ParseFromString(init_net_path.read_bytes())
+
+    onnx_model = Caffe2Frontend.caffe2_net_to_onnx_model(
+        predict_net,
+        init_net,
+        value_info
+    )
+    try:
+        onnx.checker.check_model(onnx_model)
+        print('ONNX check passed successfully.')
+        output_file.write_bytes(onnx_model.SerializeToString())
+    except onnx.onnx_cpp2py_export.checker.ValidationError as exc:
+        sys.exit('ONNX check failed with error: ' + str(exc))
+
+def main():
+    args = parse_args()
+    convert_to_onnx(args.model_path, args.weights, args.input_shape,
+        args.input_names, args.output_file, args.model_name
+    )
+
+
+if __name__ == '__main__':
+    main()
diff --git a/tools/downloader/common.py b/tools/downloader/common.py
index 11aae7ec4bf..9441422aa1c 100644
--- a/tools/downloader/common.py
+++ b/tools/downloader/common.py
@@ -29,13 +29,27 @@
 DOWNLOAD_TIMEOUT = 5 * 60
 
 # make sure to update the documentation if you modify these
-KNOWN_FRAMEWORKS = {'caffe', 'dldt', 'mxnet', 'pytorch', 'tf'}
-KNOWN_PRECISIONS = {'FP16', 'FP32', 'INT1', 'INT8'}
+KNOWN_FRAMEWORKS = {
+    'caffe': None,
+    'caffe2': 'caffe2_to_onnx.py',
+    'dldt': None,
+    'mxnet': None,
+    'onnx': None,
+    'pytorch': 'pytorch_to_onnx.py',
+    'tf': None,
+}
+KNOWN_PRECISIONS = {
+    'FP16', 'FP16-INT1', 'FP16-INT8',
+    'FP32', 'FP32-INT1', 'FP32-INT8',
+    'INT1', 'INT8',
+}
 KNOWN_TASK_TYPES = {
     'action_recognition',
     'classification',
+    'colorization',
     'detection',
     'face_recognition',
+    'feature_extraction',
     'head_pose_estimation',
     'human_pose_estimation',
     'image_processing',
@@ -292,7 +306,7 @@ def apply(self, reporter, output_dir):
 
 class Model:
     def __init__(self, name, subdirectory, files, postprocessing, mo_args, framework,
-            description, license_url, precisions, task_type, pytorch_to_onnx_args):
+                 description, license_url, precisions, task_type, conversion_to_onnx_args):
         self.name = name
         self.subdirectory = subdirectory
         self.files = files
@@ -303,7 +317,8 @@ def __init__(self, name, subdirectory, files, postprocessing, mo_args, framework
         self.license_url = license_url
         self.precisions = precisions
         self.task_type = task_type
-        self.pytorch_to_onnx_args = pytorch_to_onnx_args
+        self.conversion_to_onnx_args = conversion_to_onnx_args
+        self.converter_to_onnx = KNOWN_FRAMEWORKS[framework]
 
     @classmethod
     def deserialize(cls, model, name, subdirectory):
@@ -328,12 +343,19 @@ def deserialize(cls, model, name, subdirectory):
                 with deserialization_context('"postprocessing" #{}'.format(i)):
                     postprocessing.append(Postproc.deserialize(postproc))
 
-            pytorch_to_onnx_args = None
-            if model.get('pytorch_to_onnx', None):
-                pytorch_to_onnx_args = [validate_string('"pytorch_to_onnx" #{}'.format(i), arg)
-                                        for i, arg in enumerate(model['pytorch_to_onnx'])]
+            framework = validate_string_enum('"framework"', model['framework'], KNOWN_FRAMEWORKS.keys())
 
-            framework = validate_string_enum('"framework"', model['framework'], KNOWN_FRAMEWORKS)
+            conversion_to_onnx_args = model.get('conversion_to_onnx_args', None)
+            if KNOWN_FRAMEWORKS[framework]:
+                if not conversion_to_onnx_args:
+                    raise DeserializationError('"conversion_to_onnx_args" is absent. '
+                                               'Framework "{}" is supported only by conversion to ONNX.'
+                                               .format(framework))
+                conversion_to_onnx_args = [validate_string('"conversion_to_onnx_args" #{}'.format(i), arg)
+                                           for i, arg in enumerate(model['conversion_to_onnx_args'])]
+            else:
+                if conversion_to_onnx_args:
+                    raise DeserializationError('Conversion to ONNX not supported for "{}" framework'.format(framework))
 
             if 'model_optimizer_args' in model:
                 mo_args = [validate_string('"model_optimizer_args" #{}'.format(i), arg)
@@ -372,51 +394,32 @@ def deserialize(cls, model, name, subdirectory):
             task_type = validate_string_enum('"task_type"', model['task_type'], KNOWN_TASK_TYPES)
 
             return cls(name, subdirectory, files, postprocessing, mo_args, framework,
-                description, license_url, precisions, task_type, pytorch_to_onnx_args)
+                description, license_url, precisions, task_type, conversion_to_onnx_args)
 
 def load_models(args):
     models = []
     model_names = set()
 
-    def add_model(model):
-        models.append(model)
-
-        if models[-1].name in model_names:
-            raise DeserializationError(
-                'Duplicate model name "{}"'.format(models[-1].name))
-        model_names.add(models[-1].name)
+    model_root = (Path(__file__).resolve().parent / '../../models').resolve()
 
-    if args.config is None: # per-model configs
-        model_root = (Path(__file__).resolve().parent / '../../models').resolve()
+    for config_path in sorted(model_root.glob('**/model.yml')):
+        subdirectory = config_path.parent.relative_to(model_root)
 
-        for config_path in sorted(model_root.glob('**/model.yml')):
-            subdirectory = config_path.parent.relative_to(model_root)
+        with config_path.open('rb') as config_file, \
+                deserialization_context('In config "{}"'.format(config_path)):
 
-            with config_path.open('rb') as config_file, \
-                    deserialization_context('In config "{}"'.format(config_path)):
+            model = yaml.safe_load(config_file)
 
-                model = yaml.safe_load(config_file)
+            for bad_key in ['name', 'subdirectory']:
+                if bad_key in model:
+                    raise DeserializationError('Unsupported key "{}"'.format(bad_key))
 
-                for bad_key in ['name', 'subdirectory']:
-                    if bad_key in model:
-                        raise DeserializationError('Unsupported key "{}"'.format(bad_key))
+            models.append(Model.deserialize(model, subdirectory.name, subdirectory))
 
-                add_model(Model.deserialize(model, subdirectory.name, subdirectory))
-
-    else: # monolithic config
-        print('########## Warning: the --config option is deprecated and will be removed in a future release',
-            file=sys.stderr)
-        with args.config.open('rb') as config_file, \
-                deserialization_context('In config "{}"'.format(args.config)):
-            for i, model in enumerate(yaml.safe_load(config_file)['topologies']):
-                with deserialization_context('In model #{}'.format(i)):
-                    name = validate_string('"name"', model['name'])
-                    if not name: raise DeserializationError('"name": must not be empty')
-
-                with deserialization_context('In model "{}"'.format(name)):
-                    subdirectory = validate_relative_path('"output"', model['output'])
-
-                add_model(Model.deserialize(model, name, subdirectory))
+            if models[-1].name in model_names:
+                raise DeserializationError(
+                    'Duplicate model name "{}"'.format(models[-1].name))
+            model_names.add(models[-1].name)
 
     return models
 
diff --git a/tools/downloader/converter.py b/tools/downloader/converter.py
index 0e2f835ebff..6bf091b0ef6 100755
--- a/tools/downloader/converter.py
+++ b/tools/downloader/converter.py
@@ -18,6 +18,7 @@
 import concurrent.futures
 import os
 import platform
+import queue
 import re
 import shlex
 import string
@@ -29,6 +30,53 @@
 
 import common
 
+class JobContext:
+    def printf(self, format, *args, flush=False):
+        raise NotImplementedError
+
+    def subprocess(self, args):
+        raise NotImplementedError
+
+
+class DirectOutputContext(JobContext):
+    def printf(self, format, *args, flush=False):
+        print(format.format(*args), flush=flush)
+
+    def subprocess(self, args):
+        return subprocess.run(args).returncode == 0
+
+
+class QueuedOutputContext(JobContext):
+    def __init__(self, output_queue):
+        self._output_queue = output_queue
+
+    def printf(self, format, *args, flush=False):
+        self._output_queue.put(format.format(*args) + '\n')
+
+    def subprocess(self, args):
+        with subprocess.Popen(args, stdout=subprocess.PIPE, stderr=subprocess.STDOUT,
+                universal_newlines=True) as p:
+            for line in p.stdout:
+                self._output_queue.put(line)
+            return p.wait() == 0
+
+
+class JobWithQueuedOutput():
+    def __init__(self, output_queue, future):
+        self._output_queue = output_queue
+        self._future = future
+        self._future.add_done_callback(lambda future: self._output_queue.put(None))
+
+    def complete(self):
+        for fragment in iter(self._output_queue.get, None):
+            print(fragment, end='', flush=True) # for simplicity, flush every fragment
+
+        return self._future.result()
+
+    def cancel(self):
+        self._future.cancel()
+
+
 def quote_windows(arg):
     if not arg: return '""'
     if not re.search(r'\s|"', arg): return arg
@@ -40,34 +88,22 @@ def quote_windows(arg):
 else:
     quote_arg = shlex.quote
 
-def prefixed_printf(prefix, format, *args, **kwargs):
-    if prefix is None:
-        print(format.format(*args), **kwargs)
-    else:
-        print(prefix + ': ' + format.format(*args), **kwargs)
+def convert_to_onnx(context, model, output_dir, args):
+    context.printf('========= {}Converting {} to ONNX',
+                   '(DRY RUN) ' if args.dry_run else '', model.name)
 
-def prefixed_subprocess(prefix, args):
-    if prefix is None:
-        return subprocess.run(args).returncode == 0
+    conversion_to_onnx_args = [string.Template(arg).substitute(conv_dir=output_dir / model.subdirectory,
+                                                               dl_dir=args.download_dir / model.subdirectory)
+                               for arg in model.conversion_to_onnx_args]
+    cmd = [str(args.python), str(Path(__file__).absolute().parent / model.converter_to_onnx), *conversion_to_onnx_args]
 
-    with subprocess.Popen(args, stdout=subprocess.PIPE, stderr=subprocess.STDOUT,
-            universal_newlines=True) as p:
-        for line in p.stdout:
-            sys.stdout.write(prefix + ': ' + line)
-        return p.wait() == 0
+    context.printf('Conversion to ONNX command: {}', ' '.join(map(quote_arg, cmd)))
+    context.printf('')
 
-def convert_to_onnx(model, output_dir, args, stdout_prefix):
-    pytorch_converter = Path(__file__).absolute().parent / 'pytorch_to_onnx.py'
-    prefixed_printf(stdout_prefix, '========= {}Converting {} to ONNX',
-        '(DRY RUN) ' if args.dry_run else '', model.name)
+    success = True if args.dry_run else context.subprocess(cmd)
+    context.printf('')
 
-    pytorch_to_onnx_args = [string.Template(arg).substitute(conv_dir=output_dir / model.subdirectory,
-                                                            dl_dir=args.download_dir / model.subdirectory)
-                            for arg in model.pytorch_to_onnx_args]
-    cmd = [str(args.python), str(pytorch_converter), *pytorch_to_onnx_args]
-    prefixed_printf(stdout_prefix, 'Conversion to ONNX command: {}', ' '.join(map(quote_arg, cmd)))
-
-    return True if args.dry_run else prefixed_subprocess(stdout_prefix, cmd)
+    return success
 
 def num_jobs_arg(value_str):
     if value_str == 'auto':
@@ -83,8 +119,6 @@ def num_jobs_arg(value_str):
 
 def main():
     parser = argparse.ArgumentParser()
-    parser.add_argument('-c', '--config', type=Path, metavar='CONFIG.YML',
-        help='model configuration file (deprecated)')
     parser.add_argument('-d', '--download_dir', type=Path, metavar='DIR',
         default=Path.cwd(), help='root of the directory tree with downloaded model files')
     parser.add_argument('-o', '--output_dir', type=Path, metavar='DIR',
@@ -131,26 +165,22 @@ def main():
 
     output_dir = args.download_dir if args.output_dir is None else args.output_dir
 
-    def convert(model, do_prefix_stdout=True):
-        stdout_prefix = None
-        if do_prefix_stdout:
-            stdout_prefix = threading.current_thread().name
-
+    def convert(context, model):
         if model.mo_args is None:
-            prefixed_printf(stdout_prefix, '========= Skipping {} (no conversions defined)', model.name)
-            prefixed_printf(stdout_prefix, '')
+            context.printf('========= Skipping {} (no conversions defined)', model.name)
+            context.printf('')
             return True
 
         model_precisions = requested_precisions & model.precisions
         if not model_precisions:
-            prefixed_printf(stdout_prefix, '========= Skipping {} (all conversions skipped)', model.name)
-            prefixed_printf(stdout_prefix, '')
+            context.printf('========= Skipping {} (all conversions skipped)', model.name)
+            context.printf('')
             return True
 
         model_format = model.framework
 
-        if model.pytorch_to_onnx_args:
-            if not convert_to_onnx(model, output_dir, args, stdout_prefix):
+        if model.conversion_to_onnx_args:
+            if not convert_to_onnx(context, model, output_dir, args):
                 return False
             model_format = 'onnx'
 
@@ -160,7 +190,7 @@ def convert(model, do_prefix_stdout=True):
                                             conv_dir=output_dir / model.subdirectory)
             for arg in model.mo_args]
 
-        for model_precision in model_precisions:
+        for model_precision in sorted(model_precisions):
             mo_cmd = [str(args.python), '--', str(mo_path),
                 '--framework={}'.format(model_format),
                 '--data_type={}'.format(model_precision),
@@ -168,26 +198,39 @@ def convert(model, do_prefix_stdout=True):
                 '--model_name={}'.format(model.name),
                 *expanded_mo_args, *extra_mo_args]
 
-            prefixed_printf(stdout_prefix, '========= {}Converting {} to IR ({})',
+            context.printf('========= {}Converting {} to IR ({})',
                 '(DRY RUN) ' if args.dry_run else '', model.name, model_precision)
 
-            prefixed_printf(stdout_prefix, 'Conversion command: {}', ' '.join(map(quote_arg, mo_cmd)))
+            context.printf('Conversion command: {}', ' '.join(map(quote_arg, mo_cmd)))
 
             if not args.dry_run:
-                prefixed_printf(stdout_prefix, '', flush=True)
+                context.printf('', flush=True)
 
-                if not prefixed_subprocess(stdout_prefix, mo_cmd):
+                if not context.subprocess(mo_cmd):
                     return False
 
-            prefixed_printf(stdout_prefix, '')
+            context.printf('')
 
         return True
 
     if args.jobs == 1 or args.dry_run:
-        results = [convert(model, do_prefix_stdout=False) for model in models]
+        context = DirectOutputContext()
+        results = [convert(context, model) for model in models]
     else:
         with concurrent.futures.ThreadPoolExecutor(args.jobs) as executor:
-            results = list(executor.map(convert, models))
+            def start(model):
+                output_queue = queue.Queue()
+                return JobWithQueuedOutput(
+                    output_queue,
+                    executor.submit(convert, QueuedOutputContext(output_queue), model))
+
+            jobs = list(map(start, models))
+
+            try:
+                results = [job.complete() for job in jobs]
+            except:
+                for job in jobs: job.cancel()
+                raise
 
     failed_models = [model.name for model, successful in zip(models, results) if not successful]
 
diff --git a/tools/downloader/downloader.py b/tools/downloader/downloader.py
index 67beecbfcb0..afbfc6a3938 100755
--- a/tools/downloader/downloader.py
+++ b/tools/downloader/downloader.py
@@ -36,12 +36,15 @@
 def process_download(reporter, chunk_iterable, size, file):
     start_time = time.monotonic()
     progress_size = 0
+    hasher = hashlib.sha256()
 
     try:
         for chunk in chunk_iterable:
             if chunk:
                 duration = time.monotonic() - start_time
                 progress_size += len(chunk)
+                hasher.update(chunk)
+
                 if duration != 0:
                     speed = int(progress_size / (1024 * duration))
                     percent = str(progress_size * 100 // size)
@@ -51,6 +54,12 @@ def process_download(reporter, chunk_iterable, size, file):
                     reporter.emit_event('model_file_download_progress', size=progress_size)
 
                 file.write(chunk)
+
+                # don't attempt to finish a file if it's bigger than expected
+                if progress_size > size:
+                    break
+
+        return progress_size, hasher.digest()
     finally:
         reporter.end_progress()
 
@@ -65,24 +74,29 @@ def try_download(reporter, file, num_attempts, start_download, size):
             chunk_iterable = start_download()
             file.seek(0)
             file.truncate()
-            process_download(reporter, chunk_iterable, size, file)
-            return True
+            actual_size, hash = process_download(reporter, chunk_iterable, size, file)
+
+            if actual_size > size:
+                reporter.log_error("Remote file is longer than expected ({} B), download aborted", size)
+                # no sense in retrying - if the file is longer, there's no way it'll fix itself
+                return None
+            elif actual_size < size:
+                reporter.log_error("Downloaded file is shorter ({} B) than expected ({} B)",
+                    actual_size, size)
+                # it's possible that we got disconnected before receiving the full file,
+                # so try again
+            else:
+                return hash
         except (requests.exceptions.RequestException, ssl.SSLError):
             reporter.log_error("Download failed", exc_info=True)
 
-    return False
-
-def verify_hash(reporter, file, expected_hash, path, model_name):
-    actual_hash = hashlib.sha256()
-    while True:
-        chunk = file.read(1 << 20)
-        if not chunk: break
-        actual_hash.update(chunk)
+    return None
 
-    if actual_hash.digest() != bytes.fromhex(expected_hash):
+def verify_hash(reporter, actual_hash, expected_hash, path):
+    if actual_hash != bytes.fromhex(expected_hash):
         reporter.log_error('Hash mismatch for "{}"', path)
         reporter.log_details('Expected: {}', expected_hash)
-        reporter.log_details('Actual:   {}', actual_hash.hexdigest())
+        reporter.log_details('Actual:   {}', actual_hash.hex())
         return False
     return True
 
@@ -146,7 +160,7 @@ def try_update_cache(reporter, cache, hash, source):
     except Exception:
         reporter.log_warning('Failed to update the cache', exc_info=True)
 
-def try_retrieve(reporter, name, destination, model_file, cache, num_attempts, start_download):
+def try_retrieve(reporter, destination, model_file, cache, num_attempts, start_download):
     destination.parent.mkdir(parents=True, exist_ok=True)
 
     if try_retrieve_from_cache(reporter, cache, [[model_file.sha256, destination]]):
@@ -157,11 +171,11 @@ def try_retrieve(reporter, name, destination, model_file, cache, num_attempts, s
     success = False
 
     with destination.open('w+b') as f:
-        if try_download(reporter, f, num_attempts, start_download, model_file.size):
-            f.seek(0)
-            if verify_hash(reporter, f, model_file.sha256, destination, name):
-                try_update_cache(reporter, cache, model_file.sha256, destination)
-                success = True
+        actual_hash = try_download(reporter, f, num_attempts, start_download, model_file.size)
+
+    if actual_hash and verify_hash(reporter, actual_hash, model_file.sha256, destination):
+        try_update_cache(reporter, cache, model_file.sha256, destination)
+        success = True
 
     reporter.print()
     return success
@@ -183,8 +197,6 @@ def positive_int_arg(value_str):
 
 def main():
     parser = DownloaderArgumentParser()
-    parser.add_argument('-c', '--config', type=Path, metavar='CONFIG.YML',
-        help='model configuration file (deprecated)')
     parser.add_argument('--name', metavar='PAT[,PAT...]',
         help='download only models whose names match at least one of the specified patterns')
     parser.add_argument('--list', type=Path, metavar='FILE.LST',
@@ -240,7 +252,7 @@ def main():
 
                 destination = output / model_file.name
 
-                if not try_retrieve(model_file_reporter, model.name, destination, model_file, cache, args.num_attempts,
+                if not try_retrieve(model_file_reporter, destination, model_file, cache, args.num_attempts,
                         lambda: model_file.source.start_download(session, CHUNK_SIZE)):
                     shutil.rmtree(str(output))
                     failed_models.add(model.name)
diff --git a/tools/downloader/info_dumper.py b/tools/downloader/info_dumper.py
index 5d6a63bffb0..beb6d981d7a 100755
--- a/tools/downloader/info_dumper.py
+++ b/tools/downloader/info_dumper.py
@@ -36,8 +36,6 @@ def to_info(model):
 
 def main():
     parser = argparse.ArgumentParser()
-    parser.add_argument('-c', '--config', type=Path, metavar='CONFIG.YML',
-        help='model configuration file (deprecated)')
     parser.add_argument('--name', metavar='PAT[,PAT...]',
         help='only dump info for models whose names match at least one of the specified patterns')
     parser.add_argument('--list', type=Path, metavar='FILE.LST',
diff --git a/tools/downloader/license.txt b/tools/downloader/license.txt
deleted file mode 100644
index 29c7e63941b..00000000000
--- a/tools/downloader/license.txt
+++ /dev/null
@@ -1,3992 +0,0 @@
-Configuration file for the automation tools includes following models:
-
-==================================================================================================
-
-* densenet-121, densenet-161, densenet-169, densenet-201 - Densely Connected Convolutional Networks  https://github.com/shicai/DenseNet-Caffe
-
-License terms:
-
-    Copyright (c) 2016, Zhuang Liu.
-    All rights reserved.
-
-    Redistribution and use in source and binary forms, with or without modification,
-    are permitted provided that the following conditions are met:
-
-     * Redistributions of source code must retain the above copyright notice, this
-       list of conditions and the following disclaimer.
-
-     * Redistributions in binary form must reproduce the above copyright notice,
-       this list of conditions and the following disclaimer in the documentation
-       and/or other materials provided with the distribution.
-
-     * Neither the name DenseNet nor the names of its contributors may be used to
-       endorse or promote products derived from this software without specific
-       prior written permission.
-
-    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
-    ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
-    WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-    DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
-    ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
-    (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
-    LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
-    ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
-    (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
-    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-==================================================================================================
-
-* caffenet - CaffeNet https://arxiv.org/abs/1408.5093
-
-License terms:
-
-    This model is released for unrestricted use.
-
-==================================================================================================
-
-* squeezenet1.0, squeezenet1.1 - SqueezeNet: AlexNet-level accuracy with 50x fewer parameters and $<$0.5MB model size https://github.com/DeepScale/SqueezeNet
-
-License terms:
-
-    BSD LICENSE.
-
-    Redistribution and use in source and binary forms, with or without modification, are permitted
-    provided that the following conditions are met:
-
-    1. Redistributions of source code must retain the above copyright notice, this list of conditions
-    and the following disclaimer.
-
-    2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions
-    and the following disclaimer in the documentation and/or other materials provided with the
-    distribution.
-
-    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR
-    IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
-    FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR
-    CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
-    DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
-    DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
-    IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF
-    THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-==================================================================================================
-
-* mtcnn-p, mtcnn-r, mtcnn-o - Multi-task Cascaded Convolutional Networks: Proposal, Refine, Output https://github.com/DuinoDu/mtcnn/tree/master/model https://arxiv.org/ftp/arxiv/papers/1604/1604.02878.pdf
-
-License terms:
-
-    MIT License
-
-    Copyright (c) 2016 Kaipeng Zhang
-
-    Permission is hereby granted, free of charge, to any person obtaining a copy
-    of this software and associated documentation files (the "Software"), to deal
-    in the Software without restriction, including without limitation the rights
-    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-    copies of the Software, and to permit persons to whom the Software is
-    furnished to do so, subject to the following conditions:
-
-    The above copyright notice and this permission notice shall be included in all
-    copies or substantial portions of the Software.
-
-    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-    SOFTWARE.
-
-==================================================================================================
-
-* mask_rcnn_inception_resnet_v2_atrous_coco, mask_rcnn_inception_v2_coco, mask_rcnn_resnet101_atrous_coco, mask_rcnn_resnet50_atrous_coco - Mask R-CNN - https://arxiv.org/pdf/1703.06870.pdf
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-                                  Apache License
-                            Version 2.0, January 2004
-                         http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-       "License" shall mean the terms and conditions for use, reproduction,
-       and distribution as defined by Sections 1 through 9 of this document.
-
-       "Licensor" shall mean the copyright owner or entity authorized by
-       the copyright owner that is granting the License.
-
-       "Legal Entity" shall mean the union of the acting entity and all
-       other entities that control, are controlled by, or are under common
-       control with that entity. For the purposes of this definition,
-       "control" means (i) the power, direct or indirect, to cause the
-       direction or management of such entity, whether by contract or
-       otherwise, or (ii) ownership of fifty percent (50%) or more of the
-       outstanding shares, or (iii) beneficial ownership of such entity.
-
-       "You" (or "Your") shall mean an individual or Legal Entity
-       exercising permissions granted by this License.
-
-       "Source" form shall mean the preferred form for making modifications,
-       including but not limited to software source code, documentation
-       source, and configuration files.
-
-       "Object" form shall mean any form resulting from mechanical
-       transformation or translation of a Source form, including but
-       not limited to compiled object code, generated documentation,
-       and conversions to other media types.
-
-       "Work" shall mean the work of authorship, whether in Source or
-       Object form, made available under the License, as indicated by a
-       copyright notice that is included in or attached to the work
-       (an example is provided in the Appendix below).
-
-       "Derivative Works" shall mean any work, whether in Source or Object
-       form, that is based on (or derived from) the Work and for which the
-       editorial revisions, annotations, elaborations, or other modifications
-       represent, as a whole, an original work of authorship. For the purposes
-       of this License, Derivative Works shall not include works that remain
-       separable from, or merely link (or bind by name) to the interfaces of,
-       the Work and Derivative Works thereof.
-
-       "Contribution" shall mean any work of authorship, including
-       the original version of the Work and any modifications or additions
-       to that Work or Derivative Works thereof, that is intentionally
-       submitted to Licensor for inclusion in the Work by the copyright owner
-       or by an individual or Legal Entity authorized to submit on behalf of
-       the copyright owner. For the purposes of this definition, "submitted"
-       means any form of electronic, verbal, or written communication sent
-       to the Licensor or its representatives, including but not limited to
-       communication on electronic mailing lists, source code control systems,
-       and issue tracking systems that are managed by, or on behalf of, the
-       Licensor for the purpose of discussing and improving the Work, but
-       excluding communication that is conspicuously marked or otherwise
-       designated in writing by the copyright owner as "Not a Contribution."
-
-       "Contributor" shall mean Licensor and any individual or Legal Entity
-       on behalf of whom a Contribution has been received by Licensor and
-       subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       copyright license to reproduce, prepare Derivative Works of,
-       publicly display, publicly perform, sublicense, and distribute the
-       Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       (except as stated in this section) patent license to make, have made,
-       use, offer to sell, sell, import, and otherwise transfer the Work,
-       where such license applies only to those patent claims licensable
-       by such Contributor that are necessarily infringed by their
-       Contribution(s) alone or by combination of their Contribution(s)
-       with the Work to which such Contribution(s) was submitted. If You
-       institute patent litigation against any entity (including a
-       cross-claim or counterclaim in a lawsuit) alleging that the Work
-       or a Contribution incorporated within the Work constitutes direct
-       or contributory patent infringement, then any patent licenses
-       granted to You under this License for that Work shall terminate
-       as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-       Work or Derivative Works thereof in any medium, with or without
-       modifications, and in Source or Object form, provided that You
-       meet the following conditions:
-
-       (a) You must give any other recipients of the Work or
-           Derivative Works a copy of this License; and
-
-       (b) You must cause any modified files to carry prominent notices
-           stating that You changed the files; and
-
-       (c) You must retain, in the Source form of any Derivative Works
-           that You distribute, all copyright, patent, trademark, and
-           attribution notices from the Source form of the Work,
-           excluding those notices that do not pertain to any part of
-           the Derivative Works; and
-
-       (d) If the Work includes a "NOTICE" text file as part of its
-           distribution, then any Derivative Works that You distribute must
-           include a readable copy of the attribution notices contained
-           within such NOTICE file, excluding those notices that do not
-           pertain to any part of the Derivative Works, in at least one
-           of the following places: within a NOTICE text file distributed
-           as part of the Derivative Works; within the Source form or
-           documentation, if provided along with the Derivative Works; or,
-           within a display generated by the Derivative Works, if and
-           wherever such third-party notices normally appear. The contents
-           of the NOTICE file are for informational purposes only and
-           do not modify the License. You may add Your own attribution
-           notices within Derivative Works that You distribute, alongside
-           or as an addendum to the NOTICE text from the Work, provided
-           that such additional attribution notices cannot be construed
-           as modifying the License.
-
-       You may add Your own copyright statement to Your modifications and
-       may provide additional or different license terms and conditions
-       for use, reproduction, or distribution of Your modifications, or
-       for any such Derivative Works as a whole, provided Your use,
-       reproduction, and distribution of the Work otherwise complies with
-       the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-       any Contribution intentionally submitted for inclusion in the Work
-       by You to the Licensor shall be under the terms and conditions of
-       this License, without any additional terms or conditions.
-       Notwithstanding the above, nothing herein shall supersede or modify
-       the terms of any separate license agreement you may have executed
-       with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-       names, trademarks, service marks, or product names of the Licensor,
-       except as required for reasonable and customary use in describing the
-       origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-       agreed to in writing, Licensor provides the Work (and each
-       Contributor provides its Contributions) on an "AS IS" BASIS,
-       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-       implied, including, without limitation, any warranties or conditions
-       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-       PARTICULAR PURPOSE. You are solely responsible for determining the
-       appropriateness of using or redistributing the Work and assume any
-       risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-       whether in tort (including negligence), contract, or otherwise,
-       unless required by applicable law (such as deliberate and grossly
-       negligent acts) or agreed to in writing, shall any Contributor be
-       liable to You for damages, including any direct, indirect, special,
-       incidental, or consequential damages of any character arising as a
-       result of this License or out of the use or inability to use the
-       Work (including but not limited to damages for loss of goodwill,
-       work stoppage, computer failure or malfunction, or any and all
-       other commercial damages or losses), even if such Contributor
-       has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-       the Work or Derivative Works thereof, You may choose to offer,
-       and charge a fee for, acceptance of support, warranty, indemnity,
-       or other liability obligations and/or rights consistent with this
-       License. However, in accepting such obligations, You may act only
-       on Your own behalf and on Your sole responsibility, not on behalf
-       of any other Contributor, and only if You agree to indemnify,
-       defend, and hold each Contributor harmless for any liability
-       incurred by, or claims asserted against, such Contributor by reason
-       of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-       To apply the Apache License to your work, attach the following
-       boilerplate notice, with the fields enclosed by brackets "[]"
-       replaced with your own identifying information. (Don't include
-       the brackets!)  The text should be enclosed in the appropriate
-       comment syntax for the file format. We also recommend that a
-       file or class name and description of purpose be included on the
-       same "printed page" as the copyright notice for easier
-       identification within third-party archives.
-
-    Copyright 2016, The Authors.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* mobilenet-ssd – Common object detection architecture https://github.com/chuanqi305/MobileNet-SSD
-
-License terms:
-
-    MIT License
-
-    Copyright (c) 2018 chuanqi305
-
-    Permission is hereby granted, free of charge, to any person obtaining a copy
-    of this software and associated documentation files (the "Software"), to deal
-    in the Software without restriction, including without limitation the rights
-    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-    copies of the Software, and to permit persons to whom the Software is
-    furnished to do so, subject to the following conditions:
-
-    The above copyright notice and this permission notice shall be included in all
-    copies or substantial portions of the Software.
-
-    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-    SOFTWARE.
-
-==================================================================================================
-
-* ssd_mobilenet_v1_fpn_coco - MobileNetV1 FPN - https://arxiv.org/pdf/1807.03284.pdf
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-                                  Apache License
-                            Version 2.0, January 2004
-                         http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-       "License" shall mean the terms and conditions for use, reproduction,
-       and distribution as defined by Sections 1 through 9 of this document.
-
-       "Licensor" shall mean the copyright owner or entity authorized by
-       the copyright owner that is granting the License.
-
-       "Legal Entity" shall mean the union of the acting entity and all
-       other entities that control, are controlled by, or are under common
-       control with that entity. For the purposes of this definition,
-       "control" means (i) the power, direct or indirect, to cause the
-       direction or management of such entity, whether by contract or
-       otherwise, or (ii) ownership of fifty percent (50%) or more of the
-       outstanding shares, or (iii) beneficial ownership of such entity.
-
-       "You" (or "Your") shall mean an individual or Legal Entity
-       exercising permissions granted by this License.
-
-       "Source" form shall mean the preferred form for making modifications,
-       including but not limited to software source code, documentation
-       source, and configuration files.
-
-       "Object" form shall mean any form resulting from mechanical
-       transformation or translation of a Source form, including but
-       not limited to compiled object code, generated documentation,
-       and conversions to other media types.
-
-       "Work" shall mean the work of authorship, whether in Source or
-       Object form, made available under the License, as indicated by a
-       copyright notice that is included in or attached to the work
-       (an example is provided in the Appendix below).
-
-       "Derivative Works" shall mean any work, whether in Source or Object
-       form, that is based on (or derived from) the Work and for which the
-       editorial revisions, annotations, elaborations, or other modifications
-       represent, as a whole, an original work of authorship. For the purposes
-       of this License, Derivative Works shall not include works that remain
-       separable from, or merely link (or bind by name) to the interfaces of,
-       the Work and Derivative Works thereof.
-
-       "Contribution" shall mean any work of authorship, including
-       the original version of the Work and any modifications or additions
-       to that Work or Derivative Works thereof, that is intentionally
-       submitted to Licensor for inclusion in the Work by the copyright owner
-       or by an individual or Legal Entity authorized to submit on behalf of
-       the copyright owner. For the purposes of this definition, "submitted"
-       means any form of electronic, verbal, or written communication sent
-       to the Licensor or its representatives, including but not limited to
-       communication on electronic mailing lists, source code control systems,
-       and issue tracking systems that are managed by, or on behalf of, the
-       Licensor for the purpose of discussing and improving the Work, but
-       excluding communication that is conspicuously marked or otherwise
-       designated in writing by the copyright owner as "Not a Contribution."
-
-       "Contributor" shall mean Licensor and any individual or Legal Entity
-       on behalf of whom a Contribution has been received by Licensor and
-       subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       copyright license to reproduce, prepare Derivative Works of,
-       publicly display, publicly perform, sublicense, and distribute the
-       Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       (except as stated in this section) patent license to make, have made,
-       use, offer to sell, sell, import, and otherwise transfer the Work,
-       where such license applies only to those patent claims licensable
-       by such Contributor that are necessarily infringed by their
-       Contribution(s) alone or by combination of their Contribution(s)
-       with the Work to which such Contribution(s) was submitted. If You
-       institute patent litigation against any entity (including a
-       cross-claim or counterclaim in a lawsuit) alleging that the Work
-       or a Contribution incorporated within the Work constitutes direct
-       or contributory patent infringement, then any patent licenses
-       granted to You under this License for that Work shall terminate
-       as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-       Work or Derivative Works thereof in any medium, with or without
-       modifications, and in Source or Object form, provided that You
-       meet the following conditions:
-
-       (a) You must give any other recipients of the Work or
-           Derivative Works a copy of this License; and
-
-       (b) You must cause any modified files to carry prominent notices
-           stating that You changed the files; and
-
-       (c) You must retain, in the Source form of any Derivative Works
-           that You distribute, all copyright, patent, trademark, and
-           attribution notices from the Source form of the Work,
-           excluding those notices that do not pertain to any part of
-           the Derivative Works; and
-
-       (d) If the Work includes a "NOTICE" text file as part of its
-           distribution, then any Derivative Works that You distribute must
-           include a readable copy of the attribution notices contained
-           within such NOTICE file, excluding those notices that do not
-           pertain to any part of the Derivative Works, in at least one
-           of the following places: within a NOTICE text file distributed
-           as part of the Derivative Works; within the Source form or
-           documentation, if provided along with the Derivative Works; or,
-           within a display generated by the Derivative Works, if and
-           wherever such third-party notices normally appear. The contents
-           of the NOTICE file are for informational purposes only and
-           do not modify the License. You may add Your own attribution
-           notices within Derivative Works that You distribute, alongside
-           or as an addendum to the NOTICE text from the Work, provided
-           that such additional attribution notices cannot be construed
-           as modifying the License.
-
-       You may add Your own copyright statement to Your modifications and
-       may provide additional or different license terms and conditions
-       for use, reproduction, or distribution of Your modifications, or
-       for any such Derivative Works as a whole, provided Your use,
-       reproduction, and distribution of the Work otherwise complies with
-       the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-       any Contribution intentionally submitted for inclusion in the Work
-       by You to the Licensor shall be under the terms and conditions of
-       this License, without any additional terms or conditions.
-       Notwithstanding the above, nothing herein shall supersede or modify
-       the terms of any separate license agreement you may have executed
-       with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-       names, trademarks, service marks, or product names of the Licensor,
-       except as required for reasonable and customary use in describing the
-       origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-       agreed to in writing, Licensor provides the Work (and each
-       Contributor provides its Contributions) on an "AS IS" BASIS,
-       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-       implied, including, without limitation, any warranties or conditions
-       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-       PARTICULAR PURPOSE. You are solely responsible for determining the
-       appropriateness of using or redistributing the Work and assume any
-       risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-       whether in tort (including negligence), contract, or otherwise,
-       unless required by applicable law (such as deliberate and grossly
-       negligent acts) or agreed to in writing, shall any Contributor be
-       liable to You for damages, including any direct, indirect, special,
-       incidental, or consequential damages of any character arising as a
-       result of this License or out of the use or inability to use the
-       Work (including but not limited to damages for loss of goodwill,
-       work stoppage, computer failure or malfunction, or any and all
-       other commercial damages or losses), even if such Contributor
-       has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-       the Work or Derivative Works thereof, You may choose to offer,
-       and charge a fee for, acceptance of support, warranty, indemnity,
-       or other liability obligations and/or rights consistent with this
-       License. However, in accepting such obligations, You may act only
-       on Your own behalf and on Your sole responsibility, not on behalf
-       of any other Contributor, and only if You agree to indemnify,
-       defend, and hold each Contributor harmless for any liability
-       incurred by, or claims asserted against, such Contributor by reason
-       of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-       To apply the Apache License to your work, attach the following
-       boilerplate notice, with the fields enclosed by brackets "[]"
-       replaced with your own identifying information. (Don't include
-       the brackets!)  The text should be enclosed in the appropriate
-       comment syntax for the file format. We also recommend that a
-       file or class name and description of purpose be included on the
-       same "printed page" as the copyright notice for easier
-       identification within third-party archives.
-
-    Copyright 2016, The Authors.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* ssdlite_mobilenet_v2 - MobileNetV2 - https://arxiv.org/pdf/1801.04381.pdf
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-                                  Apache License
-                            Version 2.0, January 2004
-                         http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-       "License" shall mean the terms and conditions for use, reproduction,
-       and distribution as defined by Sections 1 through 9 of this document.
-
-       "Licensor" shall mean the copyright owner or entity authorized by
-       the copyright owner that is granting the License.
-
-       "Legal Entity" shall mean the union of the acting entity and all
-       other entities that control, are controlled by, or are under common
-       control with that entity. For the purposes of this definition,
-       "control" means (i) the power, direct or indirect, to cause the
-       direction or management of such entity, whether by contract or
-       otherwise, or (ii) ownership of fifty percent (50%) or more of the
-       outstanding shares, or (iii) beneficial ownership of such entity.
-
-       "You" (or "Your") shall mean an individual or Legal Entity
-       exercising permissions granted by this License.
-
-       "Source" form shall mean the preferred form for making modifications,
-       including but not limited to software source code, documentation
-       source, and configuration files.
-
-       "Object" form shall mean any form resulting from mechanical
-       transformation or translation of a Source form, including but
-       not limited to compiled object code, generated documentation,
-       and conversions to other media types.
-
-       "Work" shall mean the work of authorship, whether in Source or
-       Object form, made available under the License, as indicated by a
-       copyright notice that is included in or attached to the work
-       (an example is provided in the Appendix below).
-
-       "Derivative Works" shall mean any work, whether in Source or Object
-       form, that is based on (or derived from) the Work and for which the
-       editorial revisions, annotations, elaborations, or other modifications
-       represent, as a whole, an original work of authorship. For the purposes
-       of this License, Derivative Works shall not include works that remain
-       separable from, or merely link (or bind by name) to the interfaces of,
-       the Work and Derivative Works thereof.
-
-       "Contribution" shall mean any work of authorship, including
-       the original version of the Work and any modifications or additions
-       to that Work or Derivative Works thereof, that is intentionally
-       submitted to Licensor for inclusion in the Work by the copyright owner
-       or by an individual or Legal Entity authorized to submit on behalf of
-       the copyright owner. For the purposes of this definition, "submitted"
-       means any form of electronic, verbal, or written communication sent
-       to the Licensor or its representatives, including but not limited to
-       communication on electronic mailing lists, source code control systems,
-       and issue tracking systems that are managed by, or on behalf of, the
-       Licensor for the purpose of discussing and improving the Work, but
-       excluding communication that is conspicuously marked or otherwise
-       designated in writing by the copyright owner as "Not a Contribution."
-
-       "Contributor" shall mean Licensor and any individual or Legal Entity
-       on behalf of whom a Contribution has been received by Licensor and
-       subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       copyright license to reproduce, prepare Derivative Works of,
-       publicly display, publicly perform, sublicense, and distribute the
-       Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       (except as stated in this section) patent license to make, have made,
-       use, offer to sell, sell, import, and otherwise transfer the Work,
-       where such license applies only to those patent claims licensable
-       by such Contributor that are necessarily infringed by their
-       Contribution(s) alone or by combination of their Contribution(s)
-       with the Work to which such Contribution(s) was submitted. If You
-       institute patent litigation against any entity (including a
-       cross-claim or counterclaim in a lawsuit) alleging that the Work
-       or a Contribution incorporated within the Work constitutes direct
-       or contributory patent infringement, then any patent licenses
-       granted to You under this License for that Work shall terminate
-       as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-       Work or Derivative Works thereof in any medium, with or without
-       modifications, and in Source or Object form, provided that You
-       meet the following conditions:
-
-       (a) You must give any other recipients of the Work or
-           Derivative Works a copy of this License; and
-
-       (b) You must cause any modified files to carry prominent notices
-           stating that You changed the files; and
-
-       (c) You must retain, in the Source form of any Derivative Works
-           that You distribute, all copyright, patent, trademark, and
-           attribution notices from the Source form of the Work,
-           excluding those notices that do not pertain to any part of
-           the Derivative Works; and
-
-       (d) If the Work includes a "NOTICE" text file as part of its
-           distribution, then any Derivative Works that You distribute must
-           include a readable copy of the attribution notices contained
-           within such NOTICE file, excluding those notices that do not
-           pertain to any part of the Derivative Works, in at least one
-           of the following places: within a NOTICE text file distributed
-           as part of the Derivative Works; within the Source form or
-           documentation, if provided along with the Derivative Works; or,
-           within a display generated by the Derivative Works, if and
-           wherever such third-party notices normally appear. The contents
-           of the NOTICE file are for informational purposes only and
-           do not modify the License. You may add Your own attribution
-           notices within Derivative Works that You distribute, alongside
-           or as an addendum to the NOTICE text from the Work, provided
-           that such additional attribution notices cannot be construed
-           as modifying the License.
-
-       You may add Your own copyright statement to Your modifications and
-       may provide additional or different license terms and conditions
-       for use, reproduction, or distribution of Your modifications, or
-       for any such Derivative Works as a whole, provided Your use,
-       reproduction, and distribution of the Work otherwise complies with
-       the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-       any Contribution intentionally submitted for inclusion in the Work
-       by You to the Licensor shall be under the terms and conditions of
-       this License, without any additional terms or conditions.
-       Notwithstanding the above, nothing herein shall supersede or modify
-       the terms of any separate license agreement you may have executed
-       with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-       names, trademarks, service marks, or product names of the Licensor,
-       except as required for reasonable and customary use in describing the
-       origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-       agreed to in writing, Licensor provides the Work (and each
-       Contributor provides its Contributions) on an "AS IS" BASIS,
-       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-       implied, including, without limitation, any warranties or conditions
-       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-       PARTICULAR PURPOSE. You are solely responsible for determining the
-       appropriateness of using or redistributing the Work and assume any
-       risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-       whether in tort (including negligence), contract, or otherwise,
-       unless required by applicable law (such as deliberate and grossly
-       negligent acts) or agreed to in writing, shall any Contributor be
-       liable to You for damages, including any direct, indirect, special,
-       incidental, or consequential damages of any character arising as a
-       result of this License or out of the use or inability to use the
-       Work (including but not limited to damages for loss of goodwill,
-       work stoppage, computer failure or malfunction, or any and all
-       other commercial damages or losses), even if such Contributor
-       has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-       the Work or Derivative Works thereof, You may choose to offer,
-       and charge a fee for, acceptance of support, warranty, indemnity,
-       or other liability obligations and/or rights consistent with this
-       License. However, in accepting such obligations, You may act only
-       on Your own behalf and on Your sole responsibility, not on behalf
-       of any other Contributor, and only if You agree to indemnify,
-       defend, and hold each Contributor harmless for any liability
-       incurred by, or claims asserted against, such Contributor by reason
-       of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-       To apply the Apache License to your work, attach the following
-       boilerplate notice, with the fields enclosed by brackets "[]"
-       replaced with your own identifying information. (Don't include
-       the brackets!)  The text should be enclosed in the appropriate
-       comment syntax for the file format. We also recommend that a
-       file or class name and description of purpose be included on the
-       same "printed page" as the copyright notice for easier
-       identification within third-party archives.
-
-    Copyright 2016, The Authors.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* vgg16, vgg19 - Very Deep Convolutional Networks For Large-Scale Image Recognition https://arxiv.org/pdf/1409.1556.pdf
-
-License terms:
-
-    Attribution 4.0 International
-
-    =======================================================================
-
-    Creative Commons Corporation ("Creative Commons") is not a law firm and
-    does not provide legal services or legal advice. Distribution of
-    Creative Commons public licenses does not create a lawyer-client or
-    other relationship. Creative Commons makes its licenses and related
-    information available on an "as-is" basis. Creative Commons gives no
-    warranties regarding its licenses, any material licensed under their
-    terms and conditions, or any related information. Creative Commons
-    disclaims all liability for damages resulting from their use to the
-    fullest extent possible.
-
-    Using Creative Commons Public Licenses
-
-    Creative Commons public licenses provide a standard set of terms and
-    conditions that creators and other rights holders may use to share
-    original works of authorship and other material subject to copyright
-    and certain other rights specified in the public license below. The
-    following considerations are for informational purposes only, are not
-    exhaustive, and do not form part of our licenses.
-
-         Considerations for licensors: Our public licenses are
-         intended for use by those authorized to give the public
-         permission to use material in ways otherwise restricted by
-         copyright and certain other rights. Our licenses are
-         irrevocable. Licensors should read and understand the terms
-         and conditions of the license they choose before applying it.
-         Licensors should also secure all rights necessary before
-         applying our licenses so that the public can reuse the
-         material as expected. Licensors should clearly mark any
-         material not subject to the license. This includes other CC-
-         licensed material, or material used under an exception or
-         limitation to copyright. More considerations for licensors:
-        wiki.creativecommons.org/Considerations_for_licensors
-
-         Considerations for the public: By using one of our public
-         licenses, a licensor grants the public permission to use the
-         licensed material under specified terms and conditions. If
-         the licensor's permission is not necessary for any reason--for
-         example, because of any applicable exception or limitation to
-         copyright--then that use is not regulated by the license. Our
-         licenses grant only permissions under copyright and certain
-         other rights that a licensor has authority to grant. Use of
-         the licensed material may still be restricted for other
-         reasons, including because others have copyright or other
-         rights in the material. A licensor may make special requests,
-         such as asking that all changes be marked or described.
-         Although not required by our licenses, you are encouraged to
-         respect those requests where reasonable. More considerations
-         for the public:
-        wiki.creativecommons.org/Considerations_for_licensees
-
-    =======================================================================
-
-    Creative Commons Attribution 4.0 International Public License
-
-    By exercising the Licensed Rights (defined below), You accept and agree
-    to be bound by the terms and conditions of this Creative Commons
-    Attribution 4.0 International Public License ("Public License"). To the
-    extent this Public License may be interpreted as a contract, You are
-    granted the Licensed Rights in consideration of Your acceptance of
-    these terms and conditions, and the Licensor grants You such rights in
-    consideration of benefits the Licensor receives from making the
-    Licensed Material available under these terms and conditions.
-
-
-    Section 1 -- Definitions.
-
-      a. Adapted Material means material subject to Copyright and Similar
-         Rights that is derived from or based upon the Licensed Material
-         and in which the Licensed Material is translated, altered,
-         arranged, transformed, or otherwise modified in a manner requiring
-         permission under the Copyright and Similar Rights held by the
-         Licensor. For purposes of this Public License, where the Licensed
-         Material is a musical work, performance, or sound recording,
-         Adapted Material is always produced where the Licensed Material is
-         synched in timed relation with a moving image.
-
-      b. Adapter's License means the license You apply to Your Copyright
-         and Similar Rights in Your contributions to Adapted Material in
-         accordance with the terms and conditions of this Public License.
-
-      c. Copyright and Similar Rights means copyright and/or similar rights
-         closely related to copyright including, without limitation,
-         performance, broadcast, sound recording, and Sui Generis Database
-         Rights, without regard to how the rights are labeled or
-         categorized. For purposes of this Public License, the rights
-         specified in Section 2(b)(1)-(2) are not Copyright and Similar
-         Rights.
-
-      d. Effective Technological Measures means those measures that, in the
-         absence of proper authority, may not be circumvented under laws
-         fulfilling obligations under Article 11 of the WIPO Copyright
-         Treaty adopted on December 20, 1996, and/or similar international
-         agreements.
-
-      e. Exceptions and Limitations means fair use, fair dealing, and/or
-         any other exception or limitation to Copyright and Similar Rights
-         that applies to Your use of the Licensed Material.
-
-      f. Licensed Material means the artistic or literary work, database,
-         or other material to which the Licensor applied this Public
-         License.
-
-      g. Licensed Rights means the rights granted to You subject to the
-         terms and conditions of this Public License, which are limited to
-         all Copyright and Similar Rights that apply to Your use of the
-         Licensed Material and that the Licensor has authority to license.
-
-      h. Licensor means the individual(s) or entity(ies) granting rights
-         under this Public License.
-
-      i. Share means to provide material to the public by any means or
-         process that requires permission under the Licensed Rights, such
-         as reproduction, public display, public performance, distribution,
-         dissemination, communication, or importation, and to make material
-         available to the public including in ways that members of the
-         public may access the material from a place and at a time
-         individually chosen by them.
-
-      j. Sui Generis Database Rights means rights other than copyright
-         resulting from Directive 96/9/EC of the European Parliament and of
-         the Council of 11 March 1996 on the legal protection of databases,
-         as amended and/or succeeded, as well as other essentially
-         equivalent rights anywhere in the world.
-
-      k. You means the individual or entity exercising the Licensed Rights
-         under this Public License. Your has a corresponding meaning.
-
-
-    Section 2 -- Scope.
-
-      a. License grant.
-
-           1. Subject to the terms and conditions of this Public License,
-              the Licensor hereby grants You a worldwide, royalty-free,
-              non-sublicensable, non-exclusive, irrevocable license to
-              exercise the Licensed Rights in the Licensed Material to:
-
-                a. reproduce and Share the Licensed Material, in whole or
-                   in part; and
-
-                b. produce, reproduce, and Share Adapted Material.
-
-           2. Exceptions and Limitations. For the avoidance of doubt, where
-              Exceptions and Limitations apply to Your use, this Public
-              License does not apply, and You do not need to comply with
-              its terms and conditions.
-
-           3. Term. The term of this Public License is specified in Section
-              6(a).
-
-           4. Media and formats; technical modifications allowed. The
-              Licensor authorizes You to exercise the Licensed Rights in
-              all media and formats whether now known or hereafter created,
-              and to make technical modifications necessary to do so. The
-              Licensor waives and/or agrees not to assert any right or
-              authority to forbid You from making technical modifications
-              necessary to exercise the Licensed Rights, including
-              technical modifications necessary to circumvent Effective
-              Technological Measures. For purposes of this Public License,
-              simply making modifications authorized by this Section 2(a)
-              (4) never produces Adapted Material.
-
-           5. Downstream recipients.
-
-                a. Offer from the Licensor -- Licensed Material. Every
-                   recipient of the Licensed Material automatically
-                   receives an offer from the Licensor to exercise the
-                   Licensed Rights under the terms and conditions of this
-                   Public License.
-
-                b. No downstream restrictions. You may not offer or impose
-                   any additional or different terms or conditions on, or
-                   apply any Effective Technological Measures to, the
-                   Licensed Material if doing so restricts exercise of the
-                   Licensed Rights by any recipient of the Licensed
-                   Material.
-
-           6. No endorsement. Nothing in this Public License constitutes or
-              may be construed as permission to assert or imply that You
-              are, or that Your use of the Licensed Material is, connected
-              with, or sponsored, endorsed, or granted official status by,
-              the Licensor or others designated to receive attribution as
-              provided in Section 3(a)(1)(A)(i).
-
-      b. Other rights.
-
-           1. Moral rights, such as the right of integrity, are not
-              licensed under this Public License, nor are publicity,
-              privacy, and/or other similar personality rights; however, to
-              the extent possible, the Licensor waives and/or agrees not to
-              assert any such rights held by the Licensor to the limited
-              extent necessary to allow You to exercise the Licensed
-              Rights, but not otherwise.
-
-           2. Patent and trademark rights are not licensed under this
-              Public License.
-
-           3. To the extent possible, the Licensor waives any right to
-              collect royalties from You for the exercise of the Licensed
-              Rights, whether directly or through a collecting society
-              under any voluntary or waivable statutory or compulsory
-              licensing scheme. In all other cases the Licensor expressly
-              reserves any right to collect such royalties.
-
-
-    Section 3 -- License Conditions.
-
-    Your exercise of the Licensed Rights is expressly made subject to the
-    following conditions.
-
-      a. Attribution.
-
-           1. If You Share the Licensed Material (including in modified
-              form), You must:
-
-                a. retain the following if it is supplied by the Licensor
-                   with the Licensed Material:
-
-                     i. identification of the creator(s) of the Licensed
-                        Material and any others designated to receive
-                        attribution, in any reasonable manner requested by
-                        the Licensor (including by pseudonym if
-                        designated);
-
-                    ii. a copyright notice;
-
-                   iii. a notice that refers to this Public License;
-
-                    iv. a notice that refers to the disclaimer of
-                        warranties;
-
-                     v. a URI or hyperlink to the Licensed Material to the
-                        extent reasonably practicable;
-
-                b. indicate if You modified the Licensed Material and
-                   retain an indication of any previous modifications; and
-
-                c. indicate the Licensed Material is licensed under this
-                   Public License, and include the text of, or the URI or
-                   hyperlink to, this Public License.
-
-           2. You may satisfy the conditions in Section 3(a)(1) in any
-              reasonable manner based on the medium, means, and context in
-              which You Share the Licensed Material. For example, it may be
-              reasonable to satisfy the conditions by providing a URI or
-              hyperlink to a resource that includes the required
-              information.
-
-           3. If requested by the Licensor, You must remove any of the
-              information required by Section 3(a)(1)(A) to the extent
-              reasonably practicable.
-
-           4. If You Share Adapted Material You produce, the Adapter's
-              License You apply must not prevent recipients of the Adapted
-              Material from complying with this Public License.
-
-
-    Section 4 -- Sui Generis Database Rights.
-
-    Where the Licensed Rights include Sui Generis Database Rights that
-    apply to Your use of the Licensed Material:
-
-      a. for the avoidance of doubt, Section 2(a)(1) grants You the right
-         to extract, reuse, reproduce, and Share all or a substantial
-         portion of the contents of the database;
-
-      b. if You include all or a substantial portion of the database
-         contents in a database in which You have Sui Generis Database
-         Rights, then the database in which You have Sui Generis Database
-         Rights (but not its individual contents) is Adapted Material; and
-
-      c. You must comply with the conditions in Section 3(a) if You Share
-         all or a substantial portion of the contents of the database.
-
-    For the avoidance of doubt, this Section 4 supplements and does not
-    replace Your obligations under this Public License where the Licensed
-    Rights include other Copyright and Similar Rights.
-
-
-    Section 5 -- Disclaimer of Warranties and Limitation of Liability.
-
-      a. UNLESS OTHERWISE SEPARATELY UNDERTAKEN BY THE LICENSOR, TO THE
-         EXTENT POSSIBLE, THE LICENSOR OFFERS THE LICENSED MATERIAL AS-IS
-         AND AS-AVAILABLE, AND MAKES NO REPRESENTATIONS OR WARRANTIES OF
-         ANY KIND CONCERNING THE LICENSED MATERIAL, WHETHER EXPRESS,
-         IMPLIED, STATUTORY, OR OTHER. THIS INCLUDES, WITHOUT LIMITATION,
-         WARRANTIES OF TITLE, MERCHANTABILITY, FITNESS FOR A PARTICULAR
-         PURPOSE, NON-INFRINGEMENT, ABSENCE OF LATENT OR OTHER DEFECTS,
-         ACCURACY, OR THE PRESENCE OR ABSENCE OF ERRORS, WHETHER OR NOT
-         KNOWN OR DISCOVERABLE. WHERE DISCLAIMERS OF WARRANTIES ARE NOT
-         ALLOWED IN FULL OR IN PART, THIS DISCLAIMER MAY NOT APPLY TO YOU.
-
-      b. TO THE EXTENT POSSIBLE, IN NO EVENT WILL THE LICENSOR BE LIABLE
-         TO YOU ON ANY LEGAL THEORY (INCLUDING, WITHOUT LIMITATION,
-         NEGLIGENCE) OR OTHERWISE FOR ANY DIRECT, SPECIAL, INDIRECT,
-         INCIDENTAL, CONSEQUENTIAL, PUNITIVE, EXEMPLARY, OR OTHER LOSSES,
-         COSTS, EXPENSES, OR DAMAGES ARISING OUT OF THIS PUBLIC LICENSE OR
-         USE OF THE LICENSED MATERIAL, EVEN IF THE LICENSOR HAS BEEN
-         ADVISED OF THE POSSIBILITY OF SUCH LOSSES, COSTS, EXPENSES, OR
-         DAMAGES. WHERE A LIMITATION OF LIABILITY IS NOT ALLOWED IN FULL OR
-         IN PART, THIS LIMITATION MAY NOT APPLY TO YOU.
-
-      c. The disclaimer of warranties and limitation of liability provided
-         above shall be interpreted in a manner that, to the extent
-         possible, most closely approximates an absolute disclaimer and
-         waiver of all liability.
-
-
-    Section 6 -- Term and Termination.
-
-      a. This Public License applies for the term of the Copyright and
-         Similar Rights licensed here. However, if You fail to comply with
-         this Public License, then Your rights under this Public License
-         terminate automatically.
-
-      b. Where Your right to use the Licensed Material has terminated under
-         Section 6(a), it reinstates:
-
-           1. automatically as of the date the violation is cured, provided
-              it is cured within 30 days of Your discovery of the
-              violation; or
-
-           2. upon express reinstatement by the Licensor.
-
-         For the avoidance of doubt, this Section 6(b) does not affect any
-         right the Licensor may have to seek remedies for Your violations
-         of this Public License.
-
-      c. For the avoidance of doubt, the Licensor may also offer the
-         Licensed Material under separate terms or conditions or stop
-         distributing the Licensed Material at any time; however, doing so
-         will not terminate this Public License.
-
-      d. Sections 1, 5, 6, 7, and 8 survive termination of this Public
-         License.
-
-
-    Section 7 -- Other Terms and Conditions.
-
-      a. The Licensor shall not be bound by any additional or different
-         terms or conditions communicated by You unless expressly agreed.
-
-      b. Any arrangements, understandings, or agreements regarding the
-         Licensed Material not stated herein are separate from and
-         independent of the terms and conditions of this Public License.
-
-
-    Section 8 -- Interpretation.
-
-      a. For the avoidance of doubt, this Public License does not, and
-         shall not be interpreted to, reduce, limit, restrict, or impose
-         conditions on any use of the Licensed Material that could lawfully
-         be made without permission under this Public License.
-
-      b. To the extent possible, if any provision of this Public License is
-         deemed unenforceable, it shall be automatically reformed to the
-         minimum extent necessary to make it enforceable. If the provision
-         cannot be reformed, it shall be severed from this Public License
-         without affecting the enforceability of the remaining terms and
-         conditions.
-
-      c. No term or condition of this Public License will be waived and no
-         failure to comply consented to unless expressly agreed to by the
-         Licensor.
-
-      d. Nothing in this Public License constitutes or may be interpreted
-         as a limitation upon, or waiver of, any privileges and immunities
-         that apply to the Licensor or You, including from the legal
-         processes of any jurisdiction or authority.
-
-
-    =======================================================================
-
-    Creative Commons is not a party to its public
-    licenses. Notwithstanding, Creative Commons may elect to apply one of
-    its public licenses to material it publishes and in those instances
-    will be considered the “Licensor.” The text of the Creative Commons
-    public licenses is dedicated to the public domain under the CC0 Public
-    Domain Dedication. Except for the limited purpose of indicating that
-    material is shared under a Creative Commons public license or as
-    otherwise permitted by the Creative Commons policies published at
-    creativecommons.org/policies, Creative Commons does not authorize the
-    use of the trademark "Creative Commons" or any other trademark or logo
-    of Creative Commons without its prior written consent including,
-    without limitation, in connection with any unauthorized modifications
-    to any of its public licenses or any other arrangements,
-    understandings, or agreements concerning use of licensed material. For
-    the avoidance of doubt, this paragraph does not form part of the
-    public licenses.
-
-    Creative Commons may be contacted at creativecommons.org.
-
-==================================================================================================
-
-* ssd300, ssd512 - Single Shot MultiBox Detector https://arxiv.org/pdf/1512.02325.pdf
-
-License terms:
-
-    COPYRIGHT
-
-    All new contributions compared to the original branch:
-    Copyright (c) 2015, 2016 Wei Liu (UNC Chapel Hill), Dragomir Anguelov (Zoox),
-    Dumitru Erhan (Google), Christian Szegedy (Google), Scott Reed (UMich Ann Arbor),
-    Cheng-Yang Fu (UNC Chapel Hill), Alexander C. Berg (UNC Chapel Hill).
-    All rights reserved.
-
-    All contributions by the University of California:
-    Copyright (c) 2014, 2015, The Regents of the University of California (Regents)
-    All rights reserved.
-
-    All other contributions:
-    Copyright (c) 2014, 2015, the respective contributors
-    All rights reserved.
-
-    Caffe uses a shared copyright model: each contributor holds copyright over
-    their contributions to Caffe. The project versioning records all such
-    contribution and copyright details. If a contributor wants to further mark
-    their specific copyright on a particular contribution, they should indicate
-    their copyright solely in the commit message of the change when it is
-    committed.
-
-    LICENSE
-
-    Redistribution and use in source and binary forms, with or without
-    modification, are permitted provided that the following conditions are met:
-
-    1. Redistributions of source code must retain the above copyright notice, this
-       list of conditions and the following disclaimer.
-    2. Redistributions in binary form must reproduce the above copyright notice,
-       this list of conditions and the following disclaimer in the documentation
-       and/or other materials provided with the distribution.
-
-    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
-    ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
-    WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-    DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
-    ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
-    (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
-    LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
-    ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
-    (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
-    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-    CONTRIBUTION AGREEMENT
-
-    By contributing to the BVLC/caffe repository through pull-request, comment,
-    or otherwise, the contributor releases their content to the
-    license and copyright terms herein.
-
-==================================================================================================
-
-* inception-resnet-v2 - Inception-ResNet V2 architecture https://arxiv.org/pdf/1602.07261.pdf
-
-License terms:
-
-    MIT License
-
-    Copyright (c) 2017 soeaver Yang
-
-    Permission is hereby granted, free of charge, to any person obtaining a copy
-    of this software and associated documentation files (the "Software"), to deal
-    in the Software without restriction, including without limitation the rights
-    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-    copies of the Software, and to permit persons to whom the Software is
-    furnished to do so, subject to the following conditions:
-
-    The above copyright notice and this permission notice shall be included in all
-    copies or substantial portions of the Software.
-
-    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-    SOFTWARE.
-
-==================================================================================================
-
-* inception-resnet-v2-tf - Inception-ResNet V2 architecture https://arxiv.org/pdf/1602.07261.pdf
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-                                  Apache License
-                            Version 2.0, January 2004
-                         http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-       "License" shall mean the terms and conditions for use, reproduction,
-       and distribution as defined by Sections 1 through 9 of this document.
-
-       "Licensor" shall mean the copyright owner or entity authorized by
-       the copyright owner that is granting the License.
-
-       "Legal Entity" shall mean the union of the acting entity and all
-       other entities that control, are controlled by, or are under common
-       control with that entity. For the purposes of this definition,
-       "control" means (i) the power, direct or indirect, to cause the
-       direction or management of such entity, whether by contract or
-       otherwise, or (ii) ownership of fifty percent (50%) or more of the
-       outstanding shares, or (iii) beneficial ownership of such entity.
-
-       "You" (or "Your") shall mean an individual or Legal Entity
-       exercising permissions granted by this License.
-
-       "Source" form shall mean the preferred form for making modifications,
-       including but not limited to software source code, documentation
-       source, and configuration files.
-
-       "Object" form shall mean any form resulting from mechanical
-       transformation or translation of a Source form, including but
-       not limited to compiled object code, generated documentation,
-       and conversions to other media types.
-
-       "Work" shall mean the work of authorship, whether in Source or
-       Object form, made available under the License, as indicated by a
-       copyright notice that is included in or attached to the work
-       (an example is provided in the Appendix below).
-
-       "Derivative Works" shall mean any work, whether in Source or Object
-       form, that is based on (or derived from) the Work and for which the
-       editorial revisions, annotations, elaborations, or other modifications
-       represent, as a whole, an original work of authorship. For the purposes
-       of this License, Derivative Works shall not include works that remain
-       separable from, or merely link (or bind by name) to the interfaces of,
-       the Work and Derivative Works thereof.
-
-       "Contribution" shall mean any work of authorship, including
-       the original version of the Work and any modifications or additions
-       to that Work or Derivative Works thereof, that is intentionally
-       submitted to Licensor for inclusion in the Work by the copyright owner
-       or by an individual or Legal Entity authorized to submit on behalf of
-       the copyright owner. For the purposes of this definition, "submitted"
-       means any form of electronic, verbal, or written communication sent
-       to the Licensor or its representatives, including but not limited to
-       communication on electronic mailing lists, source code control systems,
-       and issue tracking systems that are managed by, or on behalf of, the
-       Licensor for the purpose of discussing and improving the Work, but
-       excluding communication that is conspicuously marked or otherwise
-       designated in writing by the copyright owner as "Not a Contribution."
-
-       "Contributor" shall mean Licensor and any individual or Legal Entity
-       on behalf of whom a Contribution has been received by Licensor and
-       subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       copyright license to reproduce, prepare Derivative Works of,
-       publicly display, publicly perform, sublicense, and distribute the
-       Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       (except as stated in this section) patent license to make, have made,
-       use, offer to sell, sell, import, and otherwise transfer the Work,
-       where such license applies only to those patent claims licensable
-       by such Contributor that are necessarily infringed by their
-       Contribution(s) alone or by combination of their Contribution(s)
-       with the Work to which such Contribution(s) was submitted. If You
-       institute patent litigation against any entity (including a
-       cross-claim or counterclaim in a lawsuit) alleging that the Work
-       or a Contribution incorporated within the Work constitutes direct
-       or contributory patent infringement, then any patent licenses
-       granted to You under this License for that Work shall terminate
-       as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-       Work or Derivative Works thereof in any medium, with or without
-       modifications, and in Source or Object form, provided that You
-       meet the following conditions:
-
-       (a) You must give any other recipients of the Work or
-           Derivative Works a copy of this License; and
-
-       (b) You must cause any modified files to carry prominent notices
-           stating that You changed the files; and
-
-       (c) You must retain, in the Source form of any Derivative Works
-           that You distribute, all copyright, patent, trademark, and
-           attribution notices from the Source form of the Work,
-           excluding those notices that do not pertain to any part of
-           the Derivative Works; and
-
-       (d) If the Work includes a "NOTICE" text file as part of its
-           distribution, then any Derivative Works that You distribute must
-           include a readable copy of the attribution notices contained
-           within such NOTICE file, excluding those notices that do not
-           pertain to any part of the Derivative Works, in at least one
-           of the following places: within a NOTICE text file distributed
-           as part of the Derivative Works; within the Source form or
-           documentation, if provided along with the Derivative Works; or,
-           within a display generated by the Derivative Works, if and
-           wherever such third-party notices normally appear. The contents
-           of the NOTICE file are for informational purposes only and
-           do not modify the License. You may add Your own attribution
-           notices within Derivative Works that You distribute, alongside
-           or as an addendum to the NOTICE text from the Work, provided
-           that such additional attribution notices cannot be construed
-           as modifying the License.
-
-       You may add Your own copyright statement to Your modifications and
-       may provide additional or different license terms and conditions
-       for use, reproduction, or distribution of Your modifications, or
-       for any such Derivative Works as a whole, provided Your use,
-       reproduction, and distribution of the Work otherwise complies with
-       the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-       any Contribution intentionally submitted for inclusion in the Work
-       by You to the Licensor shall be under the terms and conditions of
-       this License, without any additional terms or conditions.
-       Notwithstanding the above, nothing herein shall supersede or modify
-       the terms of any separate license agreement you may have executed
-       with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-       names, trademarks, service marks, or product names of the Licensor,
-       except as required for reasonable and customary use in describing the
-       origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-       agreed to in writing, Licensor provides the Work (and each
-       Contributor provides its Contributions) on an "AS IS" BASIS,
-       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-       implied, including, without limitation, any warranties or conditions
-       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-       PARTICULAR PURPOSE. You are solely responsible for determining the
-       appropriateness of using or redistributing the Work and assume any
-       risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-       whether in tort (including negligence), contract, or otherwise,
-       unless required by applicable law (such as deliberate and grossly
-       negligent acts) or agreed to in writing, shall any Contributor be
-       liable to You for damages, including any direct, indirect, special,
-       incidental, or consequential damages of any character arising as a
-       result of this License or out of the use or inability to use the
-       Work (including but not limited to damages for loss of goodwill,
-       work stoppage, computer failure or malfunction, or any and all
-       other commercial damages or losses), even if such Contributor
-       has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-       the Work or Derivative Works thereof, You may choose to offer,
-       and charge a fee for, acceptance of support, warranty, indemnity,
-       or other liability obligations and/or rights consistent with this
-       License. However, in accepting such obligations, You may act only
-       on Your own behalf and on Your sole responsibility, not on behalf
-       of any other Contributor, and only if You agree to indemnify,
-       defend, and hold each Contributor harmless for any liability
-       incurred by, or claims asserted against, such Contributor by reason
-       of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-       To apply the Apache License to your work, attach the following
-       boilerplate notice, with the fields enclosed by brackets "[]"
-       replaced with your own identifying information. (Don't include
-       the brackets!)  The text should be enclosed in the appropriate
-       comment syntax for the file format. We also recommend that a
-       file or class name and description of purpose be included on the
-       same "printed page" as the copyright notice for easier
-       identification within third-party archives.
-
-    Copyright 2016, The Authors.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* googlenet-v1 - GoogleNet v1 - Inception v1 - https://arxiv.org/pdf/1409.4842.pdf
-
-License terms:
-
-    COPYRIGHT
-
-    All contributions by the University of California:
-    Copyright (c) 2014-2017 The Regents of the University of California (Regents)
-    All rights reserved.
-
-    All other contributions:
-    Copyright (c) 2014-2017, the respective contributors
-    All rights reserved.
-
-    Caffe uses a shared copyright model: each contributor holds copyright over
-    their contributions to Caffe. The project versioning records all such
-    contribution and copyright details. If a contributor wants to further mark
-    their specific copyright on a particular contribution, they should indicate
-    their copyright solely in the commit message of the change when it is
-    committed.
-
-    LICENSE
-
-    Redistribution and use in source and binary forms, with or without
-    modification, are permitted provided that the following conditions are met:
-
-    1. Redistributions of source code must retain the above copyright notice, this
-       list of conditions and the following disclaimer.
-    2. Redistributions in binary form must reproduce the above copyright notice,
-       this list of conditions and the following disclaimer in the documentation
-       and/or other materials provided with the distribution.
-
-    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
-    ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
-    WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-    DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
-    ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
-    (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
-    LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
-    ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
-    (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
-    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-==================================================================================================
-
-* googlenet-v2 - GoogleNet v2 - Inception v2 - https://arxiv.org/pdf/1502.03167.pdf
-
-License terms:
-
-    This model is released for unrestricted use.
-
-==================================================================================================
-
-* googlenet-v4 - GoogleNet v4 - Inception v4
-
-License terms:
-
-    MIT License
-
-    Copyright (c) 2017 soeaver Yang
-
-    Permission is hereby granted, free of charge, to any person obtaining a copy
-    of this software and associated documentation files (the "Software"), to deal
-    in the Software without restriction, including without limitation the rights
-    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-    copies of the Software, and to permit persons to whom the Software is
-    furnished to do so, subject to the following conditions:
-
-    The above copyright notice and this permission notice shall be included in all
-    copies or substantial portions of the Software.
-
-    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-    SOFTWARE.
-
-==================================================================================================
-
-* alexnet - AlexNet - http://papers.nips.cc/paper/4824-imagenet-classification-with-deep-convolutional-neural-networks.pdf
-
-License terms:
-
-    This model is released for unrestricted use.
-
-==================================================================================================
-
-* ssd_mobilenet_v2_coco - MobileNetV2 object detection architecture - https://arxiv.org/pdf/1801.04381.pdf - pre-trained on the COCO dataset
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* resnet-50 - ResNet-50 - https://arxiv.org/pdf/1512.03385.pdf
-
-License terms:
-
-    The MIT License (MIT)
-
-    Copyright (c) 2016 Shaoqing Ren
-
-    Permission is hereby granted, free of charge, to any person obtaining a copy
-    of this software and associated documentation files (the "Software"), to deal
-    in the Software without restriction, including without limitation the rights
-    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-    copies of the Software, and to permit persons to whom the Software is
-    furnished to do so, subject to the following conditions:
-
-    The above copyright notice and this permission notice shall be included in all
-    copies or substantial portions of the Software.
-
-    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-    SOFTWARE.
-
-==================================================================================================
-
-* resnet-101, resnet-152 - https://arxiv.org/pdf/1512.03385.pdf
-
-License terms:
-
-    The MIT License (MIT)
-
-    Copyright (c) 2016 Shaoqing Ren
-
-    Permission is hereby granted, free of charge, to any person obtaining a copy
-    of this software and associated documentation files (the "Software"), to deal
-    in the Software without restriction, including without limitation the rights
-    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-    copies of the Software, and to permit persons to whom the Software is
-    furnished to do so, subject to the following conditions:
-
-    The above copyright notice and this permission notice shall be included in all
-    copies or substantial portions of the Software.
-
-    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-    SOFTWARE.
-
-==================================================================================================
-
-* googlenet-v3 - GoogleNet v3 - Inception v3 - https://arxiv.org/pdf/1512.00567.pdf
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* se-inception - BN-Inception with Squeeze-and-Excitation blocks - https://arxiv.org/pdf/1709.01507.pdf
-
-License terms:
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* se-resnet-50, se-resnet-101, se-resnet-152, se-resnext-50, se-resnext-101 - https://arxiv.org/pdf/1709.01507.pdf
-
-License terms:
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* Sphereface - Deep face recognition under open-set protocol - https://arxiv.org/pdf/1704.08063.pdf
-
-License terms:
-
-    MIT License
-
-    Copyright (c) 2017 Weiyang Liu and Yandong Wen
-
-    Permission is hereby granted, free of charge, to any person obtaining a copy
-    of this software and associated documentation files (the "Software"), to deal
-    in the Software without restriction, including without limitation the rights
-    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-    copies of the Software, and to permit persons to whom the Software is
-    furnished to do so, subject to the following conditions:
-
-    The above copyright notice and this permission notice shall be included in all
-    copies or substantial portions of the Software.
-
-    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-    SOFTWARE.
-
-==================================================================================================
-
-* mobilenet-v1-1.0-224 - MobileNet V1 architecture with the width multiplier 1.0 and resolution 224 - https://arxiv.org/pdf/1704.04861.pdf
-
-License terms:
-
-    BSD 3-Clause License
-
-    Copyright (c) 2017-, Shicai Yang
-    All rights reserved.
-
-    Redistribution and use in source and binary forms, with or without
-    modification, are permitted provided that the following conditions are met:
-
-    * Redistributions of source code must retain the above copyright notice, this
-      list of conditions and the following disclaimer.
-
-    * Redistributions in binary form must reproduce the above copyright notice,
-      this list of conditions and the following disclaimer in the documentation
-      and/or other materials provided with the distribution.
-
-    * Neither the name of the copyright holder nor the names of its
-      contributors may be used to endorse or promote products derived from
-      this software without specific prior written permission.
-
-    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
-    AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
-    IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-    DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
-    FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
-    DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
-    SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
-    CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
-    OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
-    OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-==================================================================================================
-
-* mobilenet-v1-1.0-224-tf - MobileNet V1 architecture with the width multiplier 1.0 and resolution 224 - https://arxiv.org/pdf/1704.04861.pdf
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-                                  Apache License
-                            Version 2.0, January 2004
-                         http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-       "License" shall mean the terms and conditions for use, reproduction,
-       and distribution as defined by Sections 1 through 9 of this document.
-
-       "Licensor" shall mean the copyright owner or entity authorized by
-       the copyright owner that is granting the License.
-
-       "Legal Entity" shall mean the union of the acting entity and all
-       other entities that control, are controlled by, or are under common
-       control with that entity. For the purposes of this definition,
-       "control" means (i) the power, direct or indirect, to cause the
-       direction or management of such entity, whether by contract or
-       otherwise, or (ii) ownership of fifty percent (50%) or more of the
-       outstanding shares, or (iii) beneficial ownership of such entity.
-
-       "You" (or "Your") shall mean an individual or Legal Entity
-       exercising permissions granted by this License.
-
-       "Source" form shall mean the preferred form for making modifications,
-       including but not limited to software source code, documentation
-       source, and configuration files.
-
-       "Object" form shall mean any form resulting from mechanical
-       transformation or translation of a Source form, including but
-       not limited to compiled object code, generated documentation,
-       and conversions to other media types.
-
-       "Work" shall mean the work of authorship, whether in Source or
-       Object form, made available under the License, as indicated by a
-       copyright notice that is included in or attached to the work
-       (an example is provided in the Appendix below).
-
-       "Derivative Works" shall mean any work, whether in Source or Object
-       form, that is based on (or derived from) the Work and for which the
-       editorial revisions, annotations, elaborations, or other modifications
-       represent, as a whole, an original work of authorship. For the purposes
-       of this License, Derivative Works shall not include works that remain
-       separable from, or merely link (or bind by name) to the interfaces of,
-       the Work and Derivative Works thereof.
-
-       "Contribution" shall mean any work of authorship, including
-       the original version of the Work and any modifications or additions
-       to that Work or Derivative Works thereof, that is intentionally
-       submitted to Licensor for inclusion in the Work by the copyright owner
-       or by an individual or Legal Entity authorized to submit on behalf of
-       the copyright owner. For the purposes of this definition, "submitted"
-       means any form of electronic, verbal, or written communication sent
-       to the Licensor or its representatives, including but not limited to
-       communication on electronic mailing lists, source code control systems,
-       and issue tracking systems that are managed by, or on behalf of, the
-       Licensor for the purpose of discussing and improving the Work, but
-       excluding communication that is conspicuously marked or otherwise
-       designated in writing by the copyright owner as "Not a Contribution."
-
-       "Contributor" shall mean Licensor and any individual or Legal Entity
-       on behalf of whom a Contribution has been received by Licensor and
-       subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       copyright license to reproduce, prepare Derivative Works of,
-       publicly display, publicly perform, sublicense, and distribute the
-       Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       (except as stated in this section) patent license to make, have made,
-       use, offer to sell, sell, import, and otherwise transfer the Work,
-       where such license applies only to those patent claims licensable
-       by such Contributor that are necessarily infringed by their
-       Contribution(s) alone or by combination of their Contribution(s)
-       with the Work to which such Contribution(s) was submitted. If You
-       institute patent litigation against any entity (including a
-       cross-claim or counterclaim in a lawsuit) alleging that the Work
-       or a Contribution incorporated within the Work constitutes direct
-       or contributory patent infringement, then any patent licenses
-       granted to You under this License for that Work shall terminate
-       as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-       Work or Derivative Works thereof in any medium, with or without
-       modifications, and in Source or Object form, provided that You
-       meet the following conditions:
-
-       (a) You must give any other recipients of the Work or
-           Derivative Works a copy of this License; and
-
-       (b) You must cause any modified files to carry prominent notices
-           stating that You changed the files; and
-
-       (c) You must retain, in the Source form of any Derivative Works
-           that You distribute, all copyright, patent, trademark, and
-           attribution notices from the Source form of the Work,
-           excluding those notices that do not pertain to any part of
-           the Derivative Works; and
-
-       (d) If the Work includes a "NOTICE" text file as part of its
-           distribution, then any Derivative Works that You distribute must
-           include a readable copy of the attribution notices contained
-           within such NOTICE file, excluding those notices that do not
-           pertain to any part of the Derivative Works, in at least one
-           of the following places: within a NOTICE text file distributed
-           as part of the Derivative Works; within the Source form or
-           documentation, if provided along with the Derivative Works; or,
-           within a display generated by the Derivative Works, if and
-           wherever such third-party notices normally appear. The contents
-           of the NOTICE file are for informational purposes only and
-           do not modify the License. You may add Your own attribution
-           notices within Derivative Works that You distribute, alongside
-           or as an addendum to the NOTICE text from the Work, provided
-           that such additional attribution notices cannot be construed
-           as modifying the License.
-
-       You may add Your own copyright statement to Your modifications and
-       may provide additional or different license terms and conditions
-       for use, reproduction, or distribution of Your modifications, or
-       for any such Derivative Works as a whole, provided Your use,
-       reproduction, and distribution of the Work otherwise complies with
-       the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-       any Contribution intentionally submitted for inclusion in the Work
-       by You to the Licensor shall be under the terms and conditions of
-       this License, without any additional terms or conditions.
-       Notwithstanding the above, nothing herein shall supersede or modify
-       the terms of any separate license agreement you may have executed
-       with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-       names, trademarks, service marks, or product names of the Licensor,
-       except as required for reasonable and customary use in describing the
-       origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-       agreed to in writing, Licensor provides the Work (and each
-       Contributor provides its Contributions) on an "AS IS" BASIS,
-       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-       implied, including, without limitation, any warranties or conditions
-       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-       PARTICULAR PURPOSE. You are solely responsible for determining the
-       appropriateness of using or redistributing the Work and assume any
-       risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-       whether in tort (including negligence), contract, or otherwise,
-       unless required by applicable law (such as deliberate and grossly
-       negligent acts) or agreed to in writing, shall any Contributor be
-       liable to You for damages, including any direct, indirect, special,
-       incidental, or consequential damages of any character arising as a
-       result of this License or out of the use or inability to use the
-       Work (including but not limited to damages for loss of goodwill,
-       work stoppage, computer failure or malfunction, or any and all
-       other commercial damages or losses), even if such Contributor
-       has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-       the Work or Derivative Works thereof, You may choose to offer,
-       and charge a fee for, acceptance of support, warranty, indemnity,
-       or other liability obligations and/or rights consistent with this
-       License. However, in accepting such obligations, You may act only
-       on Your own behalf and on Your sole responsibility, not on behalf
-       of any other Contributor, and only if You agree to indemnify,
-       defend, and hold each Contributor harmless for any liability
-       incurred by, or claims asserted against, such Contributor by reason
-       of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-       To apply the Apache License to your work, attach the following
-       boilerplate notice, with the fields enclosed by brackets "[]"
-       replaced with your own identifying information. (Don't include
-       the brackets!)  The text should be enclosed in the appropriate
-       comment syntax for the file format. We also recommend that a
-       file or class name and description of purpose be included on the
-       same "printed page" as the copyright notice for easier
-       identification within third-party archives.
-
-    Copyright 2016, The Authors.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* mobilenet-v2 - MobileNet V2 - https://arxiv.org/pdf/1801.04381.pdf
-
-License terms:
-
-    BSD 3-Clause License
-
-    Copyright (c) 2017-, Shicai Yang
-    All rights reserved.
-
-    Redistribution and use in source and binary forms, with or without
-    modification, are permitted provided that the following conditions are met:
-
-    * Redistributions of source code must retain the above copyright notice, this
-      list of conditions and the following disclaimer.
-
-    * Redistributions in binary form must reproduce the above copyright notice,
-      this list of conditions and the following disclaimer in the documentation
-      and/or other materials provided with the distribution.
-
-    * Neither the name of the copyright holder nor the names of its
-      contributors may be used to endorse or promote products derived from
-      this software without specific prior written permission.
-
-    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
-    AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
-    IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-    DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
-    FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
-    DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
-    SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
-    CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
-    OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
-    OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-==================================================================================================
-
-* faster_rcnn_inception_v2_coco - Faster R-CNN with Inception v2 - https://arxiv.org/pdf/1801.04381.pdf - pre-trained on the COCO dataset
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* deeplabv3 - Rethinking Atrous Convolution for Semantic Image Segmentation - https://arxiv.org/pdf/1706.05587.pdf
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* ctpn - Detecting Text in Natural Image with Connectionist Text Proposal Network - https://arxiv.org/pdf/1609.03605.pdf
-
-License terms:
-
-    MIT License
-
-    Copyright (c) 2017 shaohui ruan
-
-    Permission is hereby granted, free of charge, to any person obtaining a copy
-    of this software and associated documentation files (the "Software"), to deal
-    in the Software without restriction, including without limitation the rights
-    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-    copies of the Software, and to permit persons to whom the Software is
-    furnished to do so, subject to the following conditions:
-
-    The above copyright notice and this permission notice shall be included in all
-    copies or substantial portions of the Software.
-
-    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-    SOFTWARE.
-
-==================================================================================================
-
-* ssd_mobilenet_v1_coco - MobileNetV1 object detection architecture - https://arxiv.org/pdf/1807.03284.pdf - pre-trained on the COCO dataset
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* faster_rcnn_resnet101_coco - Faster R-CNN Resnet-101 - https://arxiv.org/pdf/1801.04381.pdf - pre-trained on the COCO dataset
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* mobilenet-v2-1.4-224 - MobileNet V2 architecture with the width multiplier 1.4 and resolution 224 - https://arxiv.org/abs/1801.04381
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* brain-tumor-segmentation-0001 - Cascaded UNet for brain tumor segmentation - https://arxiv.org/abs/1810.04008
-
-License terms:
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* mobilenet-v1-0.50-224, mobilenet-v1-0.50-160, mobilenet-v1-0.25-128 - MobileNet V1 architecture - https://arxiv.org/pdf/1704.04861.pdf
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-                                  Apache License
-                            Version 2.0, January 2004
-                         http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-       "License" shall mean the terms and conditions for use, reproduction,
-       and distribution as defined by Sections 1 through 9 of this document.
-
-       "Licensor" shall mean the copyright owner or entity authorized by
-       the copyright owner that is granting the License.
-
-       "Legal Entity" shall mean the union of the acting entity and all
-       other entities that control, are controlled by, or are under common
-       control with that entity. For the purposes of this definition,
-       "control" means (i) the power, direct or indirect, to cause the
-       direction or management of such entity, whether by contract or
-       otherwise, or (ii) ownership of fifty percent (50%) or more of the
-       outstanding shares, or (iii) beneficial ownership of such entity.
-
-       "You" (or "Your") shall mean an individual or Legal Entity
-       exercising permissions granted by this License.
-
-       "Source" form shall mean the preferred form for making modifications,
-       including but not limited to software source code, documentation
-       source, and configuration files.
-
-       "Object" form shall mean any form resulting from mechanical
-       transformation or translation of a Source form, including but
-       not limited to compiled object code, generated documentation,
-       and conversions to other media types.
-
-       "Work" shall mean the work of authorship, whether in Source or
-       Object form, made available under the License, as indicated by a
-       copyright notice that is included in or attached to the work
-       (an example is provided in the Appendix below).
-
-       "Derivative Works" shall mean any work, whether in Source or Object
-       form, that is based on (or derived from) the Work and for which the
-       editorial revisions, annotations, elaborations, or other modifications
-       represent, as a whole, an original work of authorship. For the purposes
-       of this License, Derivative Works shall not include works that remain
-       separable from, or merely link (or bind by name) to the interfaces of,
-       the Work and Derivative Works thereof.
-
-       "Contribution" shall mean any work of authorship, including
-       the original version of the Work and any modifications or additions
-       to that Work or Derivative Works thereof, that is intentionally
-       submitted to Licensor for inclusion in the Work by the copyright owner
-       or by an individual or Legal Entity authorized to submit on behalf of
-       the copyright owner. For the purposes of this definition, "submitted"
-       means any form of electronic, verbal, or written communication sent
-       to the Licensor or its representatives, including but not limited to
-       communication on electronic mailing lists, source code control systems,
-       and issue tracking systems that are managed by, or on behalf of, the
-       Licensor for the purpose of discussing and improving the Work, but
-       excluding communication that is conspicuously marked or otherwise
-       designated in writing by the copyright owner as "Not a Contribution."
-
-       "Contributor" shall mean Licensor and any individual or Legal Entity
-       on behalf of whom a Contribution has been received by Licensor and
-       subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       copyright license to reproduce, prepare Derivative Works of,
-       publicly display, publicly perform, sublicense, and distribute the
-       Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       (except as stated in this section) patent license to make, have made,
-       use, offer to sell, sell, import, and otherwise transfer the Work,
-       where such license applies only to those patent claims licensable
-       by such Contributor that are necessarily infringed by their
-       Contribution(s) alone or by combination of their Contribution(s)
-       with the Work to which such Contribution(s) was submitted. If You
-       institute patent litigation against any entity (including a
-       cross-claim or counterclaim in a lawsuit) alleging that the Work
-       or a Contribution incorporated within the Work constitutes direct
-       or contributory patent infringement, then any patent licenses
-       granted to You under this License for that Work shall terminate
-       as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-       Work or Derivative Works thereof in any medium, with or without
-       modifications, and in Source or Object form, provided that You
-       meet the following conditions:
-
-       (a) You must give any other recipients of the Work or
-           Derivative Works a copy of this License; and
-
-       (b) You must cause any modified files to carry prominent notices
-           stating that You changed the files; and
-
-       (c) You must retain, in the Source form of any Derivative Works
-           that You distribute, all copyright, patent, trademark, and
-           attribution notices from the Source form of the Work,
-           excluding those notices that do not pertain to any part of
-           the Derivative Works; and
-
-       (d) If the Work includes a "NOTICE" text file as part of its
-           distribution, then any Derivative Works that You distribute must
-           include a readable copy of the attribution notices contained
-           within such NOTICE file, excluding those notices that do not
-           pertain to any part of the Derivative Works, in at least one
-           of the following places: within a NOTICE text file distributed
-           as part of the Derivative Works; within the Source form or
-           documentation, if provided along with the Derivative Works; or,
-           within a display generated by the Derivative Works, if and
-           wherever such third-party notices normally appear. The contents
-           of the NOTICE file are for informational purposes only and
-           do not modify the License. You may add Your own attribution
-           notices within Derivative Works that You distribute, alongside
-           or as an addendum to the NOTICE text from the Work, provided
-           that such additional attribution notices cannot be construed
-           as modifying the License.
-
-       You may add Your own copyright statement to Your modifications and
-       may provide additional or different license terms and conditions
-       for use, reproduction, or distribution of Your modifications, or
-       for any such Derivative Works as a whole, provided Your use,
-       reproduction, and distribution of the Work otherwise complies with
-       the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-       any Contribution intentionally submitted for inclusion in the Work
-       by You to the Licensor shall be under the terms and conditions of
-       this License, without any additional terms or conditions.
-       Notwithstanding the above, nothing herein shall supersede or modify
-       the terms of any separate license agreement you may have executed
-       with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-       names, trademarks, service marks, or product names of the Licensor,
-       except as required for reasonable and customary use in describing the
-       origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-       agreed to in writing, Licensor provides the Work (and each
-       Contributor provides its Contributions) on an "AS IS" BASIS,
-       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-       implied, including, without limitation, any warranties or conditions
-       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-       PARTICULAR PURPOSE. You are solely responsible for determining the
-       appropriateness of using or redistributing the Work and assume any
-       risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-       whether in tort (including negligence), contract, or otherwise,
-       unless required by applicable law (such as deliberate and grossly
-       negligent acts) or agreed to in writing, shall any Contributor be
-       liable to You for damages, including any direct, indirect, special,
-       incidental, or consequential damages of any character arising as a
-       result of this License or out of the use or inability to use the
-       Work (including but not limited to damages for loss of goodwill,
-       work stoppage, computer failure or malfunction, or any and all
-       other commercial damages or losses), even if such Contributor
-       has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-       the Work or Derivative Works thereof, You may choose to offer,
-       and charge a fee for, acceptance of support, warranty, indemnity,
-       or other liability obligations and/or rights consistent with this
-       License. However, in accepting such obligations, You may act only
-       on Your own behalf and on Your sole responsibility, not on behalf
-       of any other Contributor, and only if You agree to indemnify,
-       defend, and hold each Contributor harmless for any liability
-       incurred by, or claims asserted against, such Contributor by reason
-       of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-       To apply the Apache License to your work, attach the following
-       boilerplate notice, with the fields enclosed by brackets "[]"
-       replaced with your own identifying information. (Don't include
-       the brackets!)  The text should be enclosed in the appropriate
-       comment syntax for the file format. We also recommend that a
-       file or class name and description of purpose be included on the
-       same "printed page" as the copyright notice for easier
-       identification within third-party archives.
-
-    Copyright 2016, The Authors.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* mobilenet-v2-1.0-224 - MobileNet V2 architecture with the width multiplier 1.0 and resolution 224 - https://arxiv.org/abs/1801.04381
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-                                  Apache License
-                            Version 2.0, January 2004
-                         http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-       "License" shall mean the terms and conditions for use, reproduction,
-       and distribution as defined by Sections 1 through 9 of this document.
-
-       "Licensor" shall mean the copyright owner or entity authorized by
-       the copyright owner that is granting the License.
-
-       "Legal Entity" shall mean the union of the acting entity and all
-       other entities that control, are controlled by, or are under common
-       control with that entity. For the purposes of this definition,
-       "control" means (i) the power, direct or indirect, to cause the
-       direction or management of such entity, whether by contract or
-       otherwise, or (ii) ownership of fifty percent (50%) or more of the
-       outstanding shares, or (iii) beneficial ownership of such entity.
-
-       "You" (or "Your") shall mean an individual or Legal Entity
-       exercising permissions granted by this License.
-
-       "Source" form shall mean the preferred form for making modifications,
-       including but not limited to software source code, documentation
-       source, and configuration files.
-
-       "Object" form shall mean any form resulting from mechanical
-       transformation or translation of a Source form, including but
-       not limited to compiled object code, generated documentation,
-       and conversions to other media types.
-
-       "Work" shall mean the work of authorship, whether in Source or
-       Object form, made available under the License, as indicated by a
-       copyright notice that is included in or attached to the work
-       (an example is provided in the Appendix below).
-
-       "Derivative Works" shall mean any work, whether in Source or Object
-       form, that is based on (or derived from) the Work and for which the
-       editorial revisions, annotations, elaborations, or other modifications
-       represent, as a whole, an original work of authorship. For the purposes
-       of this License, Derivative Works shall not include works that remain
-       separable from, or merely link (or bind by name) to the interfaces of,
-       the Work and Derivative Works thereof.
-
-       "Contribution" shall mean any work of authorship, including
-       the original version of the Work and any modifications or additions
-       to that Work or Derivative Works thereof, that is intentionally
-       submitted to Licensor for inclusion in the Work by the copyright owner
-       or by an individual or Legal Entity authorized to submit on behalf of
-       the copyright owner. For the purposes of this definition, "submitted"
-       means any form of electronic, verbal, or written communication sent
-       to the Licensor or its representatives, including but not limited to
-       communication on electronic mailing lists, source code control systems,
-       and issue tracking systems that are managed by, or on behalf of, the
-       Licensor for the purpose of discussing and improving the Work, but
-       excluding communication that is conspicuously marked or otherwise
-       designated in writing by the copyright owner as "Not a Contribution."
-
-       "Contributor" shall mean Licensor and any individual or Legal Entity
-       on behalf of whom a Contribution has been received by Licensor and
-       subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       copyright license to reproduce, prepare Derivative Works of,
-       publicly display, publicly perform, sublicense, and distribute the
-       Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       (except as stated in this section) patent license to make, have made,
-       use, offer to sell, sell, import, and otherwise transfer the Work,
-       where such license applies only to those patent claims licensable
-       by such Contributor that are necessarily infringed by their
-       Contribution(s) alone or by combination of their Contribution(s)
-       with the Work to which such Contribution(s) was submitted. If You
-       institute patent litigation against any entity (including a
-       cross-claim or counterclaim in a lawsuit) alleging that the Work
-       or a Contribution incorporated within the Work constitutes direct
-       or contributory patent infringement, then any patent licenses
-       granted to You under this License for that Work shall terminate
-       as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-       Work or Derivative Works thereof in any medium, with or without
-       modifications, and in Source or Object form, provided that You
-       meet the following conditions:
-
-       (a) You must give any other recipients of the Work or
-           Derivative Works a copy of this License; and
-
-       (b) You must cause any modified files to carry prominent notices
-           stating that You changed the files; and
-
-       (c) You must retain, in the Source form of any Derivative Works
-           that You distribute, all copyright, patent, trademark, and
-           attribution notices from the Source form of the Work,
-           excluding those notices that do not pertain to any part of
-           the Derivative Works; and
-
-       (d) If the Work includes a "NOTICE" text file as part of its
-           distribution, then any Derivative Works that You distribute must
-           include a readable copy of the attribution notices contained
-           within such NOTICE file, excluding those notices that do not
-           pertain to any part of the Derivative Works, in at least one
-           of the following places: within a NOTICE text file distributed
-           as part of the Derivative Works; within the Source form or
-           documentation, if provided along with the Derivative Works; or,
-           within a display generated by the Derivative Works, if and
-           wherever such third-party notices normally appear. The contents
-           of the NOTICE file are for informational purposes only and
-           do not modify the License. You may add Your own attribution
-           notices within Derivative Works that You distribute, alongside
-           or as an addendum to the NOTICE text from the Work, provided
-           that such additional attribution notices cannot be construed
-           as modifying the License.
-
-       You may add Your own copyright statement to Your modifications and
-       may provide additional or different license terms and conditions
-       for use, reproduction, or distribution of Your modifications, or
-       for any such Derivative Works as a whole, provided Your use,
-       reproduction, and distribution of the Work otherwise complies with
-       the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-       any Contribution intentionally submitted for inclusion in the Work
-       by You to the Licensor shall be under the terms and conditions of
-       this License, without any additional terms or conditions.
-       Notwithstanding the above, nothing herein shall supersede or modify
-       the terms of any separate license agreement you may have executed
-       with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-       names, trademarks, service marks, or product names of the Licensor,
-       except as required for reasonable and customary use in describing the
-       origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-       agreed to in writing, Licensor provides the Work (and each
-       Contributor provides its Contributions) on an "AS IS" BASIS,
-       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-       implied, including, without limitation, any warranties or conditions
-       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-       PARTICULAR PURPOSE. You are solely responsible for determining the
-       appropriateness of using or redistributing the Work and assume any
-       risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-       whether in tort (including negligence), contract, or otherwise,
-       unless required by applicable law (such as deliberate and grossly
-       negligent acts) or agreed to in writing, shall any Contributor be
-       liable to You for damages, including any direct, indirect, special,
-       incidental, or consequential damages of any character arising as a
-       result of this License or out of the use or inability to use the
-       Work (including but not limited to damages for loss of goodwill,
-       work stoppage, computer failure or malfunction, or any and all
-       other commercial damages or losses), even if such Contributor
-       has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-       the Work or Derivative Works thereof, You may choose to offer,
-       and charge a fee for, acceptance of support, warranty, indemnity,
-       or other liability obligations and/or rights consistent with this
-       License. However, in accepting such obligations, You may act only
-       on Your own behalf and on Your sole responsibility, not on behalf
-       of any other Contributor, and only if You agree to indemnify,
-       defend, and hold each Contributor harmless for any liability
-       incurred by, or claims asserted against, such Contributor by reason
-       of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-       To apply the Apache License to your work, attach the following
-       boilerplate notice, with the fields enclosed by brackets "[]"
-       replaced with your own identifying information. (Don't include
-       the brackets!)  The text should be enclosed in the appropriate
-       comment syntax for the file format. We also recommend that a
-       file or class name and description of purpose be included on the
-       same "printed page" as the copyright notice for easier
-       identification within third-party archives.
-
-    Copyright 2016, The Authors.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* faster_rcnn_resnet50_coco, faster_rcnn_inception_resnet_v2_atrous_coco - Faster R-CNN - https://arxiv.org/pdf/1801.04381.pdf
-
-License terms:
-
-    Copyright 2016 The TensorFlow Authors.  All rights reserved.
-
-                                  Apache License
-                            Version 2.0, January 2004
-                         http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-       "License" shall mean the terms and conditions for use, reproduction,
-       and distribution as defined by Sections 1 through 9 of this document.
-
-       "Licensor" shall mean the copyright owner or entity authorized by
-       the copyright owner that is granting the License.
-
-       "Legal Entity" shall mean the union of the acting entity and all
-       other entities that control, are controlled by, or are under common
-       control with that entity. For the purposes of this definition,
-       "control" means (i) the power, direct or indirect, to cause the
-       direction or management of such entity, whether by contract or
-       otherwise, or (ii) ownership of fifty percent (50%) or more of the
-       outstanding shares, or (iii) beneficial ownership of such entity.
-
-       "You" (or "Your") shall mean an individual or Legal Entity
-       exercising permissions granted by this License.
-
-       "Source" form shall mean the preferred form for making modifications,
-       including but not limited to software source code, documentation
-       source, and configuration files.
-
-       "Object" form shall mean any form resulting from mechanical
-       transformation or translation of a Source form, including but
-       not limited to compiled object code, generated documentation,
-       and conversions to other media types.
-
-       "Work" shall mean the work of authorship, whether in Source or
-       Object form, made available under the License, as indicated by a
-       copyright notice that is included in or attached to the work
-       (an example is provided in the Appendix below).
-
-       "Derivative Works" shall mean any work, whether in Source or Object
-       form, that is based on (or derived from) the Work and for which the
-       editorial revisions, annotations, elaborations, or other modifications
-       represent, as a whole, an original work of authorship. For the purposes
-       of this License, Derivative Works shall not include works that remain
-       separable from, or merely link (or bind by name) to the interfaces of,
-       the Work and Derivative Works thereof.
-
-       "Contribution" shall mean any work of authorship, including
-       the original version of the Work and any modifications or additions
-       to that Work or Derivative Works thereof, that is intentionally
-       submitted to Licensor for inclusion in the Work by the copyright owner
-       or by an individual or Legal Entity authorized to submit on behalf of
-       the copyright owner. For the purposes of this definition, "submitted"
-       means any form of electronic, verbal, or written communication sent
-       to the Licensor or its representatives, including but not limited to
-       communication on electronic mailing lists, source code control systems,
-       and issue tracking systems that are managed by, or on behalf of, the
-       Licensor for the purpose of discussing and improving the Work, but
-       excluding communication that is conspicuously marked or otherwise
-       designated in writing by the copyright owner as "Not a Contribution."
-
-       "Contributor" shall mean Licensor and any individual or Legal Entity
-       on behalf of whom a Contribution has been received by Licensor and
-       subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       copyright license to reproduce, prepare Derivative Works of,
-       publicly display, publicly perform, sublicense, and distribute the
-       Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       (except as stated in this section) patent license to make, have made,
-       use, offer to sell, sell, import, and otherwise transfer the Work,
-       where such license applies only to those patent claims licensable
-       by such Contributor that are necessarily infringed by their
-       Contribution(s) alone or by combination of their Contribution(s)
-       with the Work to which such Contribution(s) was submitted. If You
-       institute patent litigation against any entity (including a
-       cross-claim or counterclaim in a lawsuit) alleging that the Work
-       or a Contribution incorporated within the Work constitutes direct
-       or contributory patent infringement, then any patent licenses
-       granted to You under this License for that Work shall terminate
-       as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-       Work or Derivative Works thereof in any medium, with or without
-       modifications, and in Source or Object form, provided that You
-       meet the following conditions:
-
-       (a) You must give any other recipients of the Work or
-           Derivative Works a copy of this License; and
-
-       (b) You must cause any modified files to carry prominent notices
-           stating that You changed the files; and
-
-       (c) You must retain, in the Source form of any Derivative Works
-           that You distribute, all copyright, patent, trademark, and
-           attribution notices from the Source form of the Work,
-           excluding those notices that do not pertain to any part of
-           the Derivative Works; and
-
-       (d) If the Work includes a "NOTICE" text file as part of its
-           distribution, then any Derivative Works that You distribute must
-           include a readable copy of the attribution notices contained
-           within such NOTICE file, excluding those notices that do not
-           pertain to any part of the Derivative Works, in at least one
-           of the following places: within a NOTICE text file distributed
-           as part of the Derivative Works; within the Source form or
-           documentation, if provided along with the Derivative Works; or,
-           within a display generated by the Derivative Works, if and
-           wherever such third-party notices normally appear. The contents
-           of the NOTICE file are for informational purposes only and
-           do not modify the License. You may add Your own attribution
-           notices within Derivative Works that You distribute, alongside
-           or as an addendum to the NOTICE text from the Work, provided
-           that such additional attribution notices cannot be construed
-           as modifying the License.
-
-       You may add Your own copyright statement to Your modifications and
-       may provide additional or different license terms and conditions
-       for use, reproduction, or distribution of Your modifications, or
-       for any such Derivative Works as a whole, provided Your use,
-       reproduction, and distribution of the Work otherwise complies with
-       the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-       any Contribution intentionally submitted for inclusion in the Work
-       by You to the Licensor shall be under the terms and conditions of
-       this License, without any additional terms or conditions.
-       Notwithstanding the above, nothing herein shall supersede or modify
-       the terms of any separate license agreement you may have executed
-       with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-       names, trademarks, service marks, or product names of the Licensor,
-       except as required for reasonable and customary use in describing the
-       origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-       agreed to in writing, Licensor provides the Work (and each
-       Contributor provides its Contributions) on an "AS IS" BASIS,
-       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-       implied, including, without limitation, any warranties or conditions
-       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-       PARTICULAR PURPOSE. You are solely responsible for determining the
-       appropriateness of using or redistributing the Work and assume any
-       risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-       whether in tort (including negligence), contract, or otherwise,
-       unless required by applicable law (such as deliberate and grossly
-       negligent acts) or agreed to in writing, shall any Contributor be
-       liable to You for damages, including any direct, indirect, special,
-       incidental, or consequential damages of any character arising as a
-       result of this License or out of the use or inability to use the
-       Work (including but not limited to damages for loss of goodwill,
-       work stoppage, computer failure or malfunction, or any and all
-       other commercial damages or losses), even if such Contributor
-       has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-       the Work or Derivative Works thereof, You may choose to offer,
-       and charge a fee for, acceptance of support, warranty, indemnity,
-       or other liability obligations and/or rights consistent with this
-       License. However, in accepting such obligations, You may act only
-       on Your own behalf and on Your sole responsibility, not on behalf
-       of any other Contributor, and only if You agree to indemnify,
-       defend, and hold each Contributor harmless for any liability
-       incurred by, or claims asserted against, such Contributor by reason
-       of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-       To apply the Apache License to your work, attach the following
-       boilerplate notice, with the fields enclosed by brackets "[]"
-       replaced with your own identifying information. (Don't include
-       the brackets!)  The text should be enclosed in the appropriate
-       comment syntax for the file format. We also recommend that a
-       file or class name and description of purpose be included on the
-       same "printed page" as the copyright notice for easier
-       identification within third-party archives.
-
-    Copyright 2016, The Authors.
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* densenet-121-tf, densenet-169-tf, densenet-161-tf - Tensorflow implementation of DenseNet by G. Huang, Z. Liu, K. Weinberger, and L. van der Maaten with ImageNet pretrained models.
-
-License terms:
-
-                                  Apache License
-                            Version 2.0, January 2004
-                         http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-       "License" shall mean the terms and conditions for use, reproduction,
-       and distribution as defined by Sections 1 through 9 of this document.
-
-       "Licensor" shall mean the copyright owner or entity authorized by
-       the copyright owner that is granting the License.
-
-       "Legal Entity" shall mean the union of the acting entity and all
-       other entities that control, are controlled by, or are under common
-       control with that entity. For the purposes of this definition,
-       "control" means (i) the power, direct or indirect, to cause the
-       direction or management of such entity, whether by contract or
-       otherwise, or (ii) ownership of fifty percent (50%) or more of the
-       outstanding shares, or (iii) beneficial ownership of such entity.
-
-       "You" (or "Your") shall mean an individual or Legal Entity
-       exercising permissions granted by this License.
-
-       "Source" form shall mean the preferred form for making modifications,
-       including but not limited to software source code, documentation
-       source, and configuration files.
-
-       "Object" form shall mean any form resulting from mechanical
-       transformation or translation of a Source form, including but
-       not limited to compiled object code, generated documentation,
-       and conversions to other media types.
-
-       "Work" shall mean the work of authorship, whether in Source or
-       Object form, made available under the License, as indicated by a
-       copyright notice that is included in or attached to the work
-       (an example is provided in the Appendix below).
-
-       "Derivative Works" shall mean any work, whether in Source or Object
-       form, that is based on (or derived from) the Work and for which the
-       editorial revisions, annotations, elaborations, or other modifications
-       represent, as a whole, an original work of authorship. For the purposes
-       of this License, Derivative Works shall not include works that remain
-       separable from, or merely link (or bind by name) to the interfaces of,
-       the Work and Derivative Works thereof.
-
-       "Contribution" shall mean any work of authorship, including
-       the original version of the Work and any modifications or additions
-       to that Work or Derivative Works thereof, that is intentionally
-       submitted to Licensor for inclusion in the Work by the copyright owner
-       or by an individual or Legal Entity authorized to submit on behalf of
-       the copyright owner. For the purposes of this definition, "submitted"
-       means any form of electronic, verbal, or written communication sent
-       to the Licensor or its representatives, including but not limited to
-       communication on electronic mailing lists, source code control systems,
-       and issue tracking systems that are managed by, or on behalf of, the
-       Licensor for the purpose of discussing and improving the Work, but
-       excluding communication that is conspicuously marked or otherwise
-       designated in writing by the copyright owner as "Not a Contribution."
-
-       "Contributor" shall mean Licensor and any individual or Legal Entity
-       on behalf of whom a Contribution has been received by Licensor and
-       subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       copyright license to reproduce, prepare Derivative Works of,
-       publicly display, publicly perform, sublicense, and distribute the
-       Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       (except as stated in this section) patent license to make, have made,
-       use, offer to sell, sell, import, and otherwise transfer the Work,
-       where such license applies only to those patent claims licensable
-       by such Contributor that are necessarily infringed by their
-       Contribution(s) alone or by combination of their Contribution(s)
-       with the Work to which such Contribution(s) was submitted. If You
-       institute patent litigation against any entity (including a
-       cross-claim or counterclaim in a lawsuit) alleging that the Work
-       or a Contribution incorporated within the Work constitutes direct
-       or contributory patent infringement, then any patent licenses
-       granted to You under this License for that Work shall terminate
-       as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-       Work or Derivative Works thereof in any medium, with or without
-       modifications, and in Source or Object form, provided that You
-       meet the following conditions:
-
-       (a) You must give any other recipients of the Work or
-           Derivative Works a copy of this License; and
-
-       (b) You must cause any modified files to carry prominent notices
-           stating that You changed the files; and
-
-       (c) You must retain, in the Source form of any Derivative Works
-           that You distribute, all copyright, patent, trademark, and
-           attribution notices from the Source form of the Work,
-           excluding those notices that do not pertain to any part of
-           the Derivative Works; and
-
-       (d) If the Work includes a "NOTICE" text file as part of its
-           distribution, then any Derivative Works that You distribute must
-           include a readable copy of the attribution notices contained
-           within such NOTICE file, excluding those notices that do not
-           pertain to any part of the Derivative Works, in at least one
-           of the following places: within a NOTICE text file distributed
-           as part of the Derivative Works; within the Source form or
-           documentation, if provided along with the Derivative Works; or,
-           within a display generated by the Derivative Works, if and
-           wherever such third-party notices normally appear. The contents
-           of the NOTICE file are for informational purposes only and
-           do not modify the License. You may add Your own attribution
-           notices within Derivative Works that You distribute, alongside
-           or as an addendum to the NOTICE text from the Work, provided
-           that such additional attribution notices cannot be construed
-           as modifying the License.
-
-       You may add Your own copyright statement to Your modifications and
-       may provide additional or different license terms and conditions
-       for use, reproduction, or distribution of Your modifications, or
-       for any such Derivative Works as a whole, provided Your use,
-       reproduction, and distribution of the Work otherwise complies with
-       the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-       any Contribution intentionally submitted for inclusion in the Work
-       by You to the Licensor shall be under the terms and conditions of
-       this License, without any additional terms or conditions.
-       Notwithstanding the above, nothing herein shall supersede or modify
-       the terms of any separate license agreement you may have executed
-       with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-       names, trademarks, service marks, or product names of the Licensor,
-       except as required for reasonable and customary use in describing the
-       origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-       agreed to in writing, Licensor provides the Work (and each
-       Contributor provides its Contributions) on an "AS IS" BASIS,
-       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-       implied, including, without limitation, any warranties or conditions
-       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-       PARTICULAR PURPOSE. You are solely responsible for determining the
-       appropriateness of using or redistributing the Work and assume any
-       risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-       whether in tort (including negligence), contract, or otherwise,
-       unless required by applicable law (such as deliberate and grossly
-       negligent acts) or agreed to in writing, shall any Contributor be
-       liable to You for damages, including any direct, indirect, special,
-       incidental, or consequential damages of any character arising as a
-       result of this License or out of the use or inability to use the
-       Work (including but not limited to damages for loss of goodwill,
-       work stoppage, computer failure or malfunction, or any and all
-       other commercial damages or losses), even if such Contributor
-       has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-       the Work or Derivative Works thereof, You may choose to offer,
-       and charge a fee for, acceptance of support, warranty, indemnity,
-       or other liability obligations and/or rights consistent with this
-       License. However, in accepting such obligations, You may act only
-       on Your own behalf and on Your sole responsibility, not on behalf
-       of any other Contributor, and only if You agree to indemnify,
-       defend, and hold each Contributor harmless for any liability
-       incurred by, or claims asserted against, such Contributor by reason
-       of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-       To apply the Apache License to your work, attach the following
-       boilerplate notice, with the fields enclosed by brackets "{}"
-       replaced with your own identifying information. (Don't include
-       the brackets!)  The text should be enclosed in the appropriate
-       comment syntax for the file format. We also recommend that a
-       file or class name and description of purpose be included on the
-       same "printed page" as the copyright notice for easier
-       identification within third-party archives.
-
-    Copyright {yyyy} {name of copyright owner}
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* facenet-20180408-102900 - FaceNet: A Unified Embedding for Face Recognition and Clustering trained on CASIA-WebFace dataset - https://arxiv.org/pdf/1503.03832.pdf
-
-License terms:
-
-    MIT License
-
-    Copyright (c) 2016 David Sandberg
-
-    Permission is hereby granted, free of charge, to any person obtaining a copy
-    of this software and associated documentation files (the "Software"), to deal
-    in the Software without restriction, including without limitation the rights
-    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-    copies of the Software, and to permit persons to whom the Software is
-    furnished to do so, subject to the following conditions:
-
-    The above copyright notice and this permission notice shall be included in all
-    copies or substantial portions of the Software.
-
-    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-    SOFTWARE.
-
-==================================================================================================
-
-* face-detection-retail-0044
-
-License terms:
-
-                                  Apache License
-                            Version 2.0, January 2004
-                         http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-       "License" shall mean the terms and conditions for use, reproduction,
-       and distribution as defined by Sections 1 through 9 of this document.
-
-       "Licensor" shall mean the copyright owner or entity authorized by
-       the copyright owner that is granting the License.
-
-       "Legal Entity" shall mean the union of the acting entity and all
-       other entities that control, are controlled by, or are under common
-       control with that entity. For the purposes of this definition,
-       "control" means (i) the power, direct or indirect, to cause the
-       direction or management of such entity, whether by contract or
-       otherwise, or (ii) ownership of fifty percent (50%) or more of the
-       outstanding shares, or (iii) beneficial ownership of such entity.
-
-       "You" (or "Your") shall mean an individual or Legal Entity
-       exercising permissions granted by this License.
-
-       "Source" form shall mean the preferred form for making modifications,
-       including but not limited to software source code, documentation
-       source, and configuration files.
-
-       "Object" form shall mean any form resulting from mechanical
-       transformation or translation of a Source form, including but
-       not limited to compiled object code, generated documentation,
-       and conversions to other media types.
-
-       "Work" shall mean the work of authorship, whether in Source or
-       Object form, made available under the License, as indicated by a
-       copyright notice that is included in or attached to the work
-       (an example is provided in the Appendix below).
-
-       "Derivative Works" shall mean any work, whether in Source or Object
-       form, that is based on (or derived from) the Work and for which the
-       editorial revisions, annotations, elaborations, or other modifications
-       represent, as a whole, an original work of authorship. For the purposes
-       of this License, Derivative Works shall not include works that remain
-       separable from, or merely link (or bind by name) to the interfaces of,
-       the Work and Derivative Works thereof.
-
-       "Contribution" shall mean any work of authorship, including
-       the original version of the Work and any modifications or additions
-       to that Work or Derivative Works thereof, that is intentionally
-       submitted to Licensor for inclusion in the Work by the copyright owner
-       or by an individual or Legal Entity authorized to submit on behalf of
-       the copyright owner. For the purposes of this definition, "submitted"
-       means any form of electronic, verbal, or written communication sent
-       to the Licensor or its representatives, including but not limited to
-       communication on electronic mailing lists, source code control systems,
-       and issue tracking systems that are managed by, or on behalf of, the
-       Licensor for the purpose of discussing and improving the Work, but
-       excluding communication that is conspicuously marked or otherwise
-       designated in writing by the copyright owner as "Not a Contribution."
-
-       "Contributor" shall mean Licensor and any individual or Legal Entity
-       on behalf of whom a Contribution has been received by Licensor and
-       subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       copyright license to reproduce, prepare Derivative Works of,
-       publicly display, publicly perform, sublicense, and distribute the
-       Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       (except as stated in this section) patent license to make, have made,
-       use, offer to sell, sell, import, and otherwise transfer the Work,
-       where such license applies only to those patent claims licensable
-       by such Contributor that are necessarily infringed by their
-       Contribution(s) alone or by combination of their Contribution(s)
-       with the Work to which such Contribution(s) was submitted. If You
-       institute patent litigation against any entity (including a
-       cross-claim or counterclaim in a lawsuit) alleging that the Work
-       or a Contribution incorporated within the Work constitutes direct
-       or contributory patent infringement, then any patent licenses
-       granted to You under this License for that Work shall terminate
-       as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-       Work or Derivative Works thereof in any medium, with or without
-       modifications, and in Source or Object form, provided that You
-       meet the following conditions:
-
-       (a) You must give any other recipients of the Work or
-           Derivative Works a copy of this License; and
-
-       (b) You must cause any modified files to carry prominent notices
-           stating that You changed the files; and
-
-       (c) You must retain, in the Source form of any Derivative Works
-           that You distribute, all copyright, patent, trademark, and
-           attribution notices from the Source form of the Work,
-           excluding those notices that do not pertain to any part of
-           the Derivative Works; and
-
-       (d) If the Work includes a "NOTICE" text file as part of its
-           distribution, then any Derivative Works that You distribute must
-           include a readable copy of the attribution notices contained
-           within such NOTICE file, excluding those notices that do not
-           pertain to any part of the Derivative Works, in at least one
-           of the following places: within a NOTICE text file distributed
-           as part of the Derivative Works; within the Source form or
-           documentation, if provided along with the Derivative Works; or,
-           within a display generated by the Derivative Works, if and
-           wherever such third-party notices normally appear. The contents
-           of the NOTICE file are for informational purposes only and
-           do not modify the License. You may add Your own attribution
-           notices within Derivative Works that You distribute, alongside
-           or as an addendum to the NOTICE text from the Work, provided
-           that such additional attribution notices cannot be construed
-           as modifying the License.
-
-       You may add Your own copyright statement to Your modifications and
-       may provide additional or different license terms and conditions
-       for use, reproduction, or distribution of Your modifications, or
-       for any such Derivative Works as a whole, provided Your use,
-       reproduction, and distribution of the Work otherwise complies with
-       the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-       any Contribution intentionally submitted for inclusion in the Work
-       by You to the Licensor shall be under the terms and conditions of
-       this License, without any additional terms or conditions.
-       Notwithstanding the above, nothing herein shall supersede or modify
-       the terms of any separate license agreement you may have executed
-       with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-       names, trademarks, service marks, or product names of the Licensor,
-       except as required for reasonable and customary use in describing the
-       origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-       agreed to in writing, Licensor provides the Work (and each
-       Contributor provides its Contributions) on an "AS IS" BASIS,
-       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-       implied, including, without limitation, any warranties or conditions
-       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-       PARTICULAR PURPOSE. You are solely responsible for determining the
-       appropriateness of using or redistributing the Work and assume any
-       risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-       whether in tort (including negligence), contract, or otherwise,
-       unless required by applicable law (such as deliberate and grossly
-       negligent acts) or agreed to in writing, shall any Contributor be
-       liable to You for damages, including any direct, indirect, special,
-       incidental, or consequential damages of any character arising as a
-       result of this License or out of the use or inability to use the
-       Work (including but not limited to damages for loss of goodwill,
-       work stoppage, computer failure or malfunction, or any and all
-       other commercial damages or losses), even if such Contributor
-       has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-       the Work or Derivative Works thereof, You may choose to offer,
-       and charge a fee for, acceptance of support, warranty, indemnity,
-       or other liability obligations and/or rights consistent with this
-       License. However, in accepting such obligations, You may act only
-       on Your own behalf and on Your sole responsibility, not on behalf
-       of any other Contributor, and only if You agree to indemnify,
-       defend, and hold each Contributor harmless for any liability
-       incurred by, or claims asserted against, such Contributor by reason
-       of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-       To apply the Apache License to your work, attach the following
-       boilerplate notice, with the fields enclosed by brackets "[]"
-       replaced with your own identifying information. (Don't include
-       the brackets!)  The text should be enclosed in the appropriate
-       comment syntax for the file format. We also recommend that a
-       file or class name and description of purpose be included on the
-       same "printed page" as the copyright notice for easier
-       identification within third-party archives.
-
-    Copyright [yyyy] [name of copyright owner]
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* license-plate-recognition-barrier-0007
-
-License terms:
-
-    Apache License
-    Version 2.0, January 2004
-    http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-    "License" shall mean the terms and conditions for use, reproduction,
-    and distribution as defined by Sections 1 through 9 of this document.
-
-    "Licensor" shall mean the copyright owner or entity authorized by
-    the copyright owner that is granting the License.
-
-    "Legal Entity" shall mean the union of the acting entity and all
-    other entities that control, are controlled by, or are under common
-    control with that entity. For the purposes of this definition,
-    "control" means (i) the power, direct or indirect, to cause the
-    direction or management of such entity, whether by contract or
-    otherwise, or (ii) ownership of fifty percent (50%) or more of the
-    outstanding shares, or (iii) beneficial ownership of such entity.
-
-    "You" (or "Your") shall mean an individual or Legal Entity
-    exercising permissions granted by this License.
-
-    "Source" form shall mean the preferred form for making modifications,
-    including but not limited to software source code, documentation
-    source, and configuration files.
-
-    "Object" form shall mean any form resulting from mechanical
-    transformation or translation of a Source form, including but
-    not limited to compiled object code, generated documentation,
-    and conversions to other media types.
-
-    "Work" shall mean the work of authorship, whether in Source or
-    Object form, made available under the License, as indicated by a
-    copyright notice that is included in or attached to the work
-    (an example is provided in the Appendix below).
-
-    "Derivative Works" shall mean any work, whether in Source or Object
-    form, that is based on (or derived from) the Work and for which the
-    editorial revisions, annotations, elaborations, or other modifications
-    represent, as a whole, an original work of authorship. For the purposes
-    of this License, Derivative Works shall not include works that remain
-    separable from, or merely link (or bind by name) to the interfaces of,
-    the Work and Derivative Works thereof.
-
-    "Contribution" shall mean any work of authorship, including
-    the original version of the Work and any modifications or additions
-    to that Work or Derivative Works thereof, that is intentionally
-    submitted to Licensor for inclusion in the Work by the copyright owner
-    or by an individual or Legal Entity authorized to submit on behalf of
-    the copyright owner. For the purposes of this definition, "submitted"
-    means any form of electronic, verbal, or written communication sent
-    to the Licensor or its representatives, including but not limited to
-    communication on electronic mailing lists, source code control systems,
-    and issue tracking systems that are managed by, or on behalf of, the
-    Licensor for the purpose of discussing and improving the Work, but
-    excluding communication that is conspicuously marked or otherwise
-    designated in writing by the copyright owner as "Not a Contribution."
-
-    "Contributor" shall mean Licensor and any individual or Legal Entity
-    on behalf of whom a Contribution has been received by Licensor and
-    subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-    this License, each Contributor hereby grants to You a perpetual,
-    worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-    copyright license to reproduce, prepare Derivative Works of,
-    publicly display, publicly perform, sublicense, and distribute the
-    Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-    this License, each Contributor hereby grants to You a perpetual,
-    worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-    (except as stated in this section) patent license to make, have made,
-    use, offer to sell, sell, import, and otherwise transfer the Work,
-    where such license applies only to those patent claims licensable
-    by such Contributor that are necessarily infringed by their
-    Contribution(s) alone or by combination of their Contribution(s)
-    with the Work to which such Contribution(s) was submitted. If You
-    institute patent litigation against any entity (including a
-    cross-claim or counterclaim in a lawsuit) alleging that the Work
-    or a Contribution incorporated within the Work constitutes direct
-    or contributory patent infringement, then any patent licenses
-    granted to You under this License for that Work shall terminate
-    as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-    Work or Derivative Works thereof in any medium, with or without
-    modifications, and in Source or Object form, provided that You
-    meet the following conditions:
-
-    (a) You must give any other recipients of the Work or
-    Derivative Works a copy of this License; and
-
-    (b) You must cause any modified files to carry prominent notices
-    stating that You changed the files; and
-
-    (c) You must retain, in the Source form of any Derivative Works
-    that You distribute, all copyright, patent, trademark, and
-    attribution notices from the Source form of the Work,
-    excluding those notices that do not pertain to any part of
-    the Derivative Works; and
-
-    (d) If the Work includes a "NOTICE" text file as part of its
-    distribution, then any Derivative Works that You distribute must
-    include a readable copy of the attribution notices contained
-    within such NOTICE file, excluding those notices that do not
-    pertain to any part of the Derivative Works, in at least one
-    of the following places: within a NOTICE text file distributed
-    as part of the Derivative Works; within the Source form or
-    documentation, if provided along with the Derivative Works; or,
-    within a display generated by the Derivative Works, if and
-    wherever such third-party notices normally appear. The contents
-    of the NOTICE file are for informational purposes only and
-    do not modify the License. You may add Your own attribution
-    notices within Derivative Works that You distribute, alongside
-    or as an addendum to the NOTICE text from the Work, provided
-    that such additional attribution notices cannot be construed
-    as modifying the License.
-
-    You may add Your own copyright statement to Your modifications and
-    may provide additional or different license terms and conditions
-    for use, reproduction, or distribution of Your modifications, or
-    for any such Derivative Works as a whole, provided Your use,
-    reproduction, and distribution of the Work otherwise complies with
-    the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-    any Contribution intentionally submitted for inclusion in the Work
-    by You to the Licensor shall be under the terms and conditions of
-    this License, without any additional terms or conditions.
-    Notwithstanding the above, nothing herein shall supersede or modify
-    the terms of any separate license agreement you may have executed
-    with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-    names, trademarks, service marks, or product names of the Licensor,
-    except as required for reasonable and customary use in describing the
-    origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-    agreed to in writing, Licensor provides the Work (and each
-    Contributor provides its Contributions) on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-    implied, including, without limitation, any warranties or conditions
-    of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-    PARTICULAR PURPOSE. You are solely responsible for determining the
-    appropriateness of using or redistributing the Work and assume any
-    risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-    whether in tort (including negligence), contract, or otherwise,
-    unless required by applicable law (such as deliberate and grossly
-    negligent acts) or agreed to in writing, shall any Contributor be
-    liable to You for damages, including any direct, indirect, special,
-    incidental, or consequential damages of any character arising as a
-    result of this License or out of the use or inability to use the
-    Work (including but not limited to damages for loss of goodwill,
-    work stoppage, computer failure or malfunction, or any and all
-    other commercial damages or losses), even if such Contributor
-    has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-    the Work or Derivative Works thereof, You may choose to offer,
-    and charge a fee for, acceptance of support, warranty, indemnity,
-    or other liability obligations and/or rights consistent with this
-    License. However, in accepting such obligations, You may act only
-    on Your own behalf and on Your sole responsibility, not on behalf
-    of any other Contributor, and only if You agree to indemnify,
-    defend, and hold each Contributor harmless for any liability
-    incurred by, or claims asserted against, such Contributor by reason
-    of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-    To apply the Apache License to your work, attach the following
-    boilerplate notice, with the fields enclosed by brackets "[]"
-    replaced with your own identifying information. (Don't include
-    the brackets!)  The text should be enclosed in the appropriate
-    comment syntax for the file format. We also recommend that a
-    file or class name and description of purpose be included on the
-    same "printed page" as the copyright notice for easier
-    identification within third-party archives.
-
-    Copyright [yyyy] [name of copyright owner]
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-    http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* action-recognition-0001-decoder
-* action-recognition-0001-encoder
-* age-gender-recognition-retail-0013
-* driver-action-recognition-adas-0002-decoder
-* driver-action-recognition-adas-0002-encoder
-* emotions-recognition-retail-0003
-* face-detection-adas-0001
-* face-detection-adas-binary-0001
-* face-detection-retail-0004
-* face-detection-retail-0005
-* face-reidentification-retail-0095
-* facial-landmarks-35-adas-0002
-* gaze-estimation-adas-0002
-* handwritten-score-recognition-0003
-* head-pose-estimation-adas-0001
-* human-pose-estimation-0001
-* inceptionv3-int8-sparse-v1-tf-0001
-* inceptionv3-int8-sparse-v2-tf-0001
-* inceptionv3-int8-tf-0001
-* instance-segmentation-security-0010
-* instance-segmentation-security-0050
-* instance-segmentation-security-0083
-* landmarks-regression-retail-0009
-* license-plate-recognition-barrier-0001
-* mobilenet-v2-pytorch
-* mobilenetv2-int8-sparse-v1-tf-0001
-* mobilenetv2-int8-sparse-v2-tf-0001
-* mobilenetv2-int8-tf-0001
-* pedestrian-and-vehicle-detector-adas-0001
-* pedestrian-detection-adas-0002
-* pedestrian-detection-adas-binary-0001
-* person-attributes-recognition-crossroad-0230
-* person-detection-action-recognition-0005
-* person-detection-action-recognition-0006
-* person-detection-action-recognition-teacher-0002
-* person-detection-raisinghand-recognition-0001
-* person-detection-retail-0002
-* person-detection-retail-0013
-* person-reidentification-retail-0031
-* person-reidentification-retail-0076
-* person-reidentification-retail-0079
-* person-vehicle-bike-detection-crossroad-0078
-* person-vehicle-bike-detection-crossroad-1016
-* resnet-50-int8-sparse-v1-tf-0001
-* resnet-50-int8-sparse-v2-tf-0001
-* resnet-50-int8-tf-0001
-* resnet50-binary-0001
-* road-segmentation-adas-0001
-* semantic-segmentation-adas-0001
-* single-image-super-resolution-1032
-* single-image-super-resolution-1033
-* text-detection-0003
-* text-detection-0004
-* text-image-super-resolution-0001
-* text-recognition-0012
-* vehicle-attributes-recognition-barrier-0039
-* vehicle-detection-adas-0002
-* vehicle-detection-adas-binary-0001
-* vehicle-license-plate-detection-barrier-0106
-
-License terms:
-
-                                  Apache License
-                            Version 2.0, January 2004
-                         http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-       "License" shall mean the terms and conditions for use, reproduction,
-       and distribution as defined by Sections 1 through 9 of this document.
-
-       "Licensor" shall mean the copyright owner or entity authorized by
-       the copyright owner that is granting the License.
-
-       "Legal Entity" shall mean the union of the acting entity and all
-       other entities that control, are controlled by, or are under common
-       control with that entity. For the purposes of this definition,
-       "control" means (i) the power, direct or indirect, to cause the
-       direction or management of such entity, whether by contract or
-       otherwise, or (ii) ownership of fifty percent (50%) or more of the
-       outstanding shares, or (iii) beneficial ownership of such entity.
-
-       "You" (or "Your") shall mean an individual or Legal Entity
-       exercising permissions granted by this License.
-
-       "Source" form shall mean the preferred form for making modifications,
-       including but not limited to software source code, documentation
-       source, and configuration files.
-
-       "Object" form shall mean any form resulting from mechanical
-       transformation or translation of a Source form, including but
-       not limited to compiled object code, generated documentation,
-       and conversions to other media types.
-
-       "Work" shall mean the work of authorship, whether in Source or
-       Object form, made available under the License, as indicated by a
-       copyright notice that is included in or attached to the work
-       (an example is provided in the Appendix below).
-
-       "Derivative Works" shall mean any work, whether in Source or Object
-       form, that is based on (or derived from) the Work and for which the
-       editorial revisions, annotations, elaborations, or other modifications
-       represent, as a whole, an original work of authorship. For the purposes
-       of this License, Derivative Works shall not include works that remain
-       separable from, or merely link (or bind by name) to the interfaces of,
-       the Work and Derivative Works thereof.
-
-       "Contribution" shall mean any work of authorship, including
-       the original version of the Work and any modifications or additions
-       to that Work or Derivative Works thereof, that is intentionally
-       submitted to Licensor for inclusion in the Work by the copyright owner
-       or by an individual or Legal Entity authorized to submit on behalf of
-       the copyright owner. For the purposes of this definition, "submitted"
-       means any form of electronic, verbal, or written communication sent
-       to the Licensor or its representatives, including but not limited to
-       communication on electronic mailing lists, source code control systems,
-       and issue tracking systems that are managed by, or on behalf of, the
-       Licensor for the purpose of discussing and improving the Work, but
-       excluding communication that is conspicuously marked or otherwise
-       designated in writing by the copyright owner as "Not a Contribution."
-
-       "Contributor" shall mean Licensor and any individual or Legal Entity
-       on behalf of whom a Contribution has been received by Licensor and
-       subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       copyright license to reproduce, prepare Derivative Works of,
-       publicly display, publicly perform, sublicense, and distribute the
-       Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-       this License, each Contributor hereby grants to You a perpetual,
-       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-       (except as stated in this section) patent license to make, have made,
-       use, offer to sell, sell, import, and otherwise transfer the Work,
-       where such license applies only to those patent claims licensable
-       by such Contributor that are necessarily infringed by their
-       Contribution(s) alone or by combination of their Contribution(s)
-       with the Work to which such Contribution(s) was submitted. If You
-       institute patent litigation against any entity (including a
-       cross-claim or counterclaim in a lawsuit) alleging that the Work
-       or a Contribution incorporated within the Work constitutes direct
-       or contributory patent infringement, then any patent licenses
-       granted to You under this License for that Work shall terminate
-       as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-       Work or Derivative Works thereof in any medium, with or without
-       modifications, and in Source or Object form, provided that You
-       meet the following conditions:
-
-       (a) You must give any other recipients of the Work or
-           Derivative Works a copy of this License; and
-
-       (b) You must cause any modified files to carry prominent notices
-           stating that You changed the files; and
-
-       (c) You must retain, in the Source form of any Derivative Works
-           that You distribute, all copyright, patent, trademark, and
-           attribution notices from the Source form of the Work,
-           excluding those notices that do not pertain to any part of
-           the Derivative Works; and
-
-       (d) If the Work includes a "NOTICE" text file as part of its
-           distribution, then any Derivative Works that You distribute must
-           include a readable copy of the attribution notices contained
-           within such NOTICE file, excluding those notices that do not
-           pertain to any part of the Derivative Works, in at least one
-           of the following places: within a NOTICE text file distributed
-           as part of the Derivative Works; within the Source form or
-           documentation, if provided along with the Derivative Works; or,
-           within a display generated by the Derivative Works, if and
-           wherever such third-party notices normally appear. The contents
-           of the NOTICE file are for informational purposes only and
-           do not modify the License. You may add Your own attribution
-           notices within Derivative Works that You distribute, alongside
-           or as an addendum to the NOTICE text from the Work, provided
-           that such additional attribution notices cannot be construed
-           as modifying the License.
-
-       You may add Your own copyright statement to Your modifications and
-       may provide additional or different license terms and conditions
-       for use, reproduction, or distribution of Your modifications, or
-       for any such Derivative Works as a whole, provided Your use,
-       reproduction, and distribution of the Work otherwise complies with
-       the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-       any Contribution intentionally submitted for inclusion in the Work
-       by You to the Licensor shall be under the terms and conditions of
-       this License, without any additional terms or conditions.
-       Notwithstanding the above, nothing herein shall supersede or modify
-       the terms of any separate license agreement you may have executed
-       with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-       names, trademarks, service marks, or product names of the Licensor,
-       except as required for reasonable and customary use in describing the
-       origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-       agreed to in writing, Licensor provides the Work (and each
-       Contributor provides its Contributions) on an "AS IS" BASIS,
-       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-       implied, including, without limitation, any warranties or conditions
-       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-       PARTICULAR PURPOSE. You are solely responsible for determining the
-       appropriateness of using or redistributing the Work and assume any
-       risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-       whether in tort (including negligence), contract, or otherwise,
-       unless required by applicable law (such as deliberate and grossly
-       negligent acts) or agreed to in writing, shall any Contributor be
-       liable to You for damages, including any direct, indirect, special,
-       incidental, or consequential damages of any character arising as a
-       result of this License or out of the use or inability to use the
-       Work (including but not limited to damages for loss of goodwill,
-       work stoppage, computer failure or malfunction, or any and all
-       other commercial damages or losses), even if such Contributor
-       has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-       the Work or Derivative Works thereof, You may choose to offer,
-       and charge a fee for, acceptance of support, warranty, indemnity,
-       or other liability obligations and/or rights consistent with this
-       License. However, in accepting such obligations, You may act only
-       on Your own behalf and on Your sole responsibility, not on behalf
-       of any other Contributor, and only if You agree to indemnify,
-       defend, and hold each Contributor harmless for any liability
-       incurred by, or claims asserted against, such Contributor by reason
-       of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-       To apply the Apache License to your work, attach the following
-       boilerplate notice, with the fields enclosed by brackets "[]"
-       replaced with your own identifying information. (Don't include
-       the brackets!)  The text should be enclosed in the appropriate
-       comment syntax for the file format. We also recommend that a
-       file or class name and description of purpose be included on the
-       same "printed page" as the copyright notice for easier
-       identification within third-party archives.
-
-    Copyright [yyyy] [name of copyright owner]
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-        http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* googlenet-v3-pytorch, resnet-50-pytorch - the torchvision package https://github.com/pytorch/vision
-
-License terms:
-
-    BSD 3-Clause License
-
-    Copyright (c) Soumith Chintala 2016,
-    All rights reserved.
-
-    Redistribution and use in source and binary forms, with or without
-    modification, are permitted provided that the following conditions are met:
-
-    * Redistributions of source code must retain the above copyright notice, this
-      list of conditions and the following disclaimer.
-
-    * Redistributions in binary form must reproduce the above copyright notice,
-      this list of conditions and the following disclaimer in the documentation
-      and/or other materials provided with the distribution.
-
-    * Neither the name of the copyright holder nor the names of its
-      contributors may be used to endorse or promote products derived from
-      this software without specific prior written permission.
-
-    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
-    AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
-    IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-    DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
-    FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
-    DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
-    SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
-    CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
-    OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
-    OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-==================================================================================================
-
-* octave-densenet-121-0.125 - octave convolution networks https://github.com/facebookresearch/OctConv
-* octave-resnet-26-0.25 - octave convolution networks https://github.com/facebookresearch/OctConv
-* octave-resnet-50-0.125 - octave convolution networks https://github.com/facebookresearch/OctConv
-* octave-resnet-101-0.125 - octave convolution networks https://github.com/facebookresearch/OctConv
-* octave-resnet-200-0.125 - octave convolution networks https://github.com/facebookresearch/OctConv
-* octave-resnext-50-0.25 - octave convolution networks https://github.com/facebookresearch/OctConv
-* octave-resnext-101-0.25 - octave convolution networks https://github.com/facebookresearch/OctConv
-* octave-se-resnet-50-0.125 - octave convolution networks https://github.com/facebookresearch/OctConv
-
-License terms:
-
-    MIT License
-
-    Copyright (c) Facebook, Inc. and its affiliates.
-
-    Permission is hereby granted, free of charge, to any person obtaining a copy
-    of this software and associated documentation files (the "Software"), to deal
-    in the Software without restriction, including without limitation the rights
-    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-    copies of the Software, and to permit persons to whom the Software is
-    furnished to do so, subject to the following conditions:
-
-    The above copyright notice and this permission notice shall be included in all
-    copies or substantial portions of the Software.
-
-    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-    SOFTWARE.
-
-==================================================================================================
-
-* image-retrieval-0001 - an image retrieval model based on Mobilenet v2 as
-  a backbone. The model produces l2-normalized embeddings with a dimension
-  of 256.
-
-License terms:
-
-    Apache License
-    Version 2.0, January 2004
-    http://www.apache.org/licenses/
-
-    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-    1. Definitions.
-
-    "License" shall mean the terms and conditions for use, reproduction,
-    and distribution as defined by Sections 1 through 9 of this document.
-
-    "Licensor" shall mean the copyright owner or entity authorized by
-    the copyright owner that is granting the License.
-
-    "Legal Entity" shall mean the union of the acting entity and all
-    other entities that control, are controlled by, or are under common
-    control with that entity. For the purposes of this definition,
-    "control" means (i) the power, direct or indirect, to cause the
-    direction or management of such entity, whether by contract or
-    otherwise, or (ii) ownership of fifty percent (50%) or more of the
-    outstanding shares, or (iii) beneficial ownership of such entity.
-
-    "You" (or "Your") shall mean an individual or Legal Entity
-    exercising permissions granted by this License.
-
-    "Source" form shall mean the preferred form for making modifications,
-    including but not limited to software source code, documentation
-    source, and configuration files.
-
-    "Object" form shall mean any form resulting from mechanical
-    transformation or translation of a Source form, including but
-    not limited to compiled object code, generated documentation,
-    and conversions to other media types.
-
-    "Work" shall mean the work of authorship, whether in Source or
-    Object form, made available under the License, as indicated by a
-    copyright notice that is included in or attached to the work
-    (an example is provided in the Appendix below).
-
-    "Derivative Works" shall mean any work, whether in Source or Object
-    form, that is based on (or derived from) the Work and for which the
-    editorial revisions, annotations, elaborations, or other modifications
-    represent, as a whole, an original work of authorship. For the purposes
-    of this License, Derivative Works shall not include works that remain
-    separable from, or merely link (or bind by name) to the interfaces of,
-    the Work and Derivative Works thereof.
-
-    "Contribution" shall mean any work of authorship, including
-    the original version of the Work and any modifications or additions
-    to that Work or Derivative Works thereof, that is intentionally
-    submitted to Licensor for inclusion in the Work by the copyright owner
-    or by an individual or Legal Entity authorized to submit on behalf of
-    the copyright owner. For the purposes of this definition, "submitted"
-    means any form of electronic, verbal, or written communication sent
-    to the Licensor or its representatives, including but not limited to
-    communication on electronic mailing lists, source code control systems,
-    and issue tracking systems that are managed by, or on behalf of, the
-    Licensor for the purpose of discussing and improving the Work, but
-    excluding communication that is conspicuously marked or otherwise
-    designated in writing by the copyright owner as "Not a Contribution."
-
-    "Contributor" shall mean Licensor and any individual or Legal Entity
-    on behalf of whom a Contribution has been received by Licensor and
-    subsequently incorporated within the Work.
-
-    2. Grant of Copyright License. Subject to the terms and conditions of
-    this License, each Contributor hereby grants to You a perpetual,
-    worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-    copyright license to reproduce, prepare Derivative Works of,
-    publicly display, publicly perform, sublicense, and distribute the
-    Work and such Derivative Works in Source or Object form.
-
-    3. Grant of Patent License. Subject to the terms and conditions of
-    this License, each Contributor hereby grants to You a perpetual,
-    worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-    (except as stated in this section) patent license to make, have made,
-    use, offer to sell, sell, import, and otherwise transfer the Work,
-    where such license applies only to those patent claims licensable
-    by such Contributor that are necessarily infringed by their
-    Contribution(s) alone or by combination of their Contribution(s)
-    with the Work to which such Contribution(s) was submitted. If You
-    institute patent litigation against any entity (including a
-    cross-claim or counterclaim in a lawsuit) alleging that the Work
-    or a Contribution incorporated within the Work constitutes direct
-    or contributory patent infringement, then any patent licenses
-    granted to You under this License for that Work shall terminate
-    as of the date such litigation is filed.
-
-    4. Redistribution. You may reproduce and distribute copies of the
-    Work or Derivative Works thereof in any medium, with or without
-    modifications, and in Source or Object form, provided that You
-    meet the following conditions:
-
-    (a) You must give any other recipients of the Work or
-    Derivative Works a copy of this License; and
-
-    (b) You must cause any modified files to carry prominent notices
-    stating that You changed the files; and
-
-    (c) You must retain, in the Source form of any Derivative Works
-    that You distribute, all copyright, patent, trademark, and
-    attribution notices from the Source form of the Work,
-    excluding those notices that do not pertain to any part of
-    the Derivative Works; and
-
-    (d) If the Work includes a "NOTICE" text file as part of its
-    distribution, then any Derivative Works that You distribute must
-    include a readable copy of the attribution notices contained
-    within such NOTICE file, excluding those notices that do not
-    pertain to any part of the Derivative Works, in at least one
-    of the following places: within a NOTICE text file distributed
-    as part of the Derivative Works; within the Source form or
-    documentation, if provided along with the Derivative Works; or,
-    within a display generated by the Derivative Works, if and
-    wherever such third-party notices normally appear. The contents
-    of the NOTICE file are for informational purposes only and
-    do not modify the License. You may add Your own attribution
-    notices within Derivative Works that You distribute, alongside
-    or as an addendum to the NOTICE text from the Work, provided
-    that such additional attribution notices cannot be construed
-    as modifying the License.
-
-    You may add Your own copyright statement to Your modifications and
-    may provide additional or different license terms and conditions
-    for use, reproduction, or distribution of Your modifications, or
-    for any such Derivative Works as a whole, provided Your use,
-    reproduction, and distribution of the Work otherwise complies with
-    the conditions stated in this License.
-
-    5. Submission of Contributions. Unless You explicitly state otherwise,
-    any Contribution intentionally submitted for inclusion in the Work
-    by You to the Licensor shall be under the terms and conditions of
-    this License, without any additional terms or conditions.
-    Notwithstanding the above, nothing herein shall supersede or modify
-    the terms of any separate license agreement you may have executed
-    with Licensor regarding such Contributions.
-
-    6. Trademarks. This License does not grant permission to use the trade
-    names, trademarks, service marks, or product names of the Licensor,
-    except as required for reasonable and customary use in describing the
-    origin of the Work and reproducing the content of the NOTICE file.
-
-    7. Disclaimer of Warranty. Unless required by applicable law or
-    agreed to in writing, Licensor provides the Work (and each
-    Contributor provides its Contributions) on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-    implied, including, without limitation, any warranties or conditions
-    of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-    PARTICULAR PURPOSE. You are solely responsible for determining the
-    appropriateness of using or redistributing the Work and assume any
-    risks associated with Your exercise of permissions under this License.
-
-    8. Limitation of Liability. In no event and under no legal theory,
-    whether in tort (including negligence), contract, or otherwise,
-    unless required by applicable law (such as deliberate and grossly
-    negligent acts) or agreed to in writing, shall any Contributor be
-    liable to You for damages, including any direct, indirect, special,
-    incidental, or consequential damages of any character arising as a
-    result of this License or out of the use or inability to use the
-    Work (including but not limited to damages for loss of goodwill,
-    work stoppage, computer failure or malfunction, or any and all
-    other commercial damages or losses), even if such Contributor
-    has been advised of the possibility of such damages.
-
-    9. Accepting Warranty or Additional Liability. While redistributing
-    the Work or Derivative Works thereof, You may choose to offer,
-    and charge a fee for, acceptance of support, warranty, indemnity,
-    or other liability obligations and/or rights consistent with this
-    License. However, in accepting such obligations, You may act only
-    on Your own behalf and on Your sole responsibility, not on behalf
-    of any other Contributor, and only if You agree to indemnify,
-    defend, and hold each Contributor harmless for any liability
-    incurred by, or claims asserted against, such Contributor by reason
-    of your accepting any such warranty or additional liability.
-
-    END OF TERMS AND CONDITIONS
-
-    APPENDIX: How to apply the Apache License to your work.
-
-    To apply the Apache License to your work, attach the following
-    boilerplate notice, with the fields enclosed by brackets "[]"
-    replaced with your own identifying information. (Don't include
-    the brackets!)  The text should be enclosed in the appropriate
-    comment syntax for the file format. We also recommend that a
-    file or class name and description of purpose be included on the
-    same "printed page" as the copyright notice for easier
-    identification within third-party archives.
-
-    Copyright [yyyy] [name of copyright owner]
-
-    Licensed under the Apache License, Version 2.0 (the "License");
-    you may not use this file except in compliance with the License.
-    You may obtain a copy of the License at
-
-    http://www.apache.org/licenses/LICENSE-2.0
-
-    Unless required by applicable law or agreed to in writing, software
-    distributed under the License is distributed on an "AS IS" BASIS,
-    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-    See the License for the specific language governing permissions and
-    limitations under the License.
-
-==================================================================================================
-
-* models/public/face-recognition-resnet100-arcface - LResNet100E-IR,ArcFace@ms1m-refine-v2 - https://github.com/deepinsight/insightface
-* models/public/face-recognition-resnet50-arcface - LResNet50E-IR,ArcFace@ms1m-refine-v1 - https://github.com/deepinsight/insightface
-* models/public/face-recognition-resnet34-arcface - LResNet34E-IR,ArcFace@ms1m-refine-v1 - https://github.com/deepinsight/insightface
-* models/public/face-recognition-mobilefacenet-arcface - MobileFaceNet,ArcFace@ms1m-refine-v1  - https://github.com/deepinsight/insightface
-
-License terms:
-
-    MIT License
-
-    Copyright (c) 2018 Jiankang Deng and Jia Guo
-
-    Permission is hereby granted, free of charge, to any person obtaining a copy
-    of this software and associated documentation files (the "Software"), to deal
-    in the Software without restriction, including without limitation the rights
-    to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-    copies of the Software, and to permit persons to whom the Software is
-    furnished to do so, subject to the following conditions:
-
-    The above copyright notice and this permission notice shall be included in all
-    copies or substantial portions of the Software.
-
-    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-    OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-    SOFTWARE.
-
-==================================================================================================
diff --git a/tools/downloader/pytorch_to_onnx.py b/tools/downloader/pytorch_to_onnx.py
index 80dec8fcc17..1cd2d84d7fb 100644
--- a/tools/downloader/pytorch_to_onnx.py
+++ b/tools/downloader/pytorch_to_onnx.py
@@ -22,6 +22,17 @@ def positive_int_arg(values):
     return result
 
 
+def model_parameter(parameter):  # argparse "type" callable: turns 'name=value' into a (name, value) tuple
+    param, value = parameter.split('=', 1)  # split on the first '=' only, so the value may itself contain '='
+    try:
+        value = eval(value, {}, {})  # NOTE(security): runs arbitrary Python (builtins stay reachable); trusted input only
+    except NameError as err:  # raised e.g. for an unquoted string value such as name=foo
+        print('Cannot evaluate {!r} value in {}. For string values use "{}=\'{}\'" (with all quotes).'
+              .format(value, parameter, param, value))
+        sys.exit(err)  # exits with the NameError as the exit message
+    return param, value
+
+
 def parse_args():
     """Parse input arguments"""
 
@@ -42,15 +53,16 @@ def parse_args():
     parser.add_argument('--import-module', type=str, default='',
                         help='Name of module, which contains model\'s constructor.'
                         'Requires if model not from Torchvision')
-    parser.add_argument('--input-names', type=str, nargs='+',
-                        help='Space separated names of the input layers')
-    parser.add_argument('--output-names', type=str, nargs='+',
-                        help='Space separated names of the output layers')
+    parser.add_argument('--input-names', type=str, metavar='L[,L...]',
+                        help='Comma-separated names of the input layers')
+    parser.add_argument('--output-names', type=str, metavar='L[,L...]',
+                        help='Comma-separated names of the output layers')
-
+    parser.add_argument('--model-param', type=model_parameter, default=[], action='append',
+                        help='Pair "name"="value" of model constructor parameter')
     return parser.parse_args()
 
 
-def load_model(model_name, weights, from_torchvision=True, model_path=None, module_name=None):
+def load_model(model_name, weights, from_torchvision, model_path, module_name, model_params):
     """Import model and load pretrained weights"""
 
     if from_torchvision:
@@ -72,7 +84,7 @@ def load_model(model_name, weights, from_torchvision=True, model_path=None, modu
         try:
             module = __import__(module_name)
             creator = getattr(module, model_name)
-            model = creator()
+            model = creator(**model_params)
         except ImportError as err:
             print('Module {} in {} doesn\'t exist. Check import path and name'.format(model_name, model_path))
             sys.exit(err)
@@ -95,8 +107,9 @@ def convert_to_onnx(model, input_shape, output_file, input_names, output_names):
     output_file.parent.mkdir(parents=True, exist_ok=True)
     model.eval()
     dummy_input = torch.randn(input_shape)
-    torch.onnx.export(model, dummy_input, str(output_file),
-                      verbose=False, input_names=input_names, output_names=output_names)
+    model(dummy_input)
+    in_names, out_names = (n.split(',') if n else None for n in (input_names, output_names))  # None if omitted
+    torch.onnx.export(model, dummy_input, str(output_file), verbose=False, input_names=in_names, output_names=out_names)
 
     # Model check after conversion
     model = onnx.load(str(output_file))
@@ -109,7 +122,9 @@ def convert_to_onnx(model, input_shape, output_file, input_names, output_names):
 
 def main():
     args = parse_args()
-    model = load_model(args.model_name, args.weights, args.from_torchvision, args.model_path, args.import_module)
+    model = load_model(args.model_name, args.weights, args.from_torchvision,
+                       args.model_path, args.import_module, dict(args.model_param))
+
     convert_to_onnx(model, args.input_shape, args.output_file, args.input_names, args.output_names)
 
 
diff --git a/tools/downloader/requirements-caffe2.in b/tools/downloader/requirements-caffe2.in
new file mode 100644
index 00000000000..5f1ceb698af
--- /dev/null
+++ b/tools/downloader/requirements-caffe2.in
@@ -0,0 +1,3 @@
+future
+onnx
+torch
diff --git a/tools/downloader/tests/representative-models.lst b/tools/downloader/tests/representative-models.lst
index 81b4005e76d..f20286c989d 100644
--- a/tools/downloader/tests/representative-models.lst
+++ b/tools/downloader/tests/representative-models.lst
@@ -4,5 +4,6 @@ mobilenet-v1-0.25-128 # TensorFlow, HTTP downloads
 mobilenet-v2-pytorch # PyTorch (external module), Google Drive downloads
 mtcnn-p # Caffe, HTTPS downloads, regex replacement
 octave-densenet-121-0.125 # MXNet, archive unpacking
+resnet-50-caffe2 # Caffe2
 resnet-50-pytorch # PyTorch (torchvision)
 single-image-super-resolution-1032 # DLDT