Skip to content

Commit 988fc3b

Browse files
authored
CVS-77193 DAG layout intersections & binary image handling changes (#1143)
- dag reports correct intersection of 2 layouts if 2 inputs are connected to the same pipeline input - binary input is accepted for DAGs/models with layouts which intersect correctly with N...HWC layout (for example N... (default), N?... (default demulti), ... (custom node), NHWC, N?HWC (demulti), NH..., N...C, etc) - binary input resize and multiple image alignment is performed only for layouts NHWC, N?HWC and ...
1 parent 73f3b61 commit 988fc3b

19 files changed

+562
-176
lines changed

docs/binary_input.md

+8-2
Original file line numberDiff line numberDiff line change
@@ -19,11 +19,17 @@ is out of range it will be adjusted to the nearer border. For example, when mode
1919
- if input shape is [1,90,200,3] it will be resized into [1,100,200,3]
2020
- if input shape is [1,220,200,3] it will be resized into [1,200,200,3]
2121

22-
Processing the binary image requests requires the model or the custom nodes to accept NHWC layout in BGR color
22+
In order to use binary input functionality, model or pipeline input layout needs to be compatible with `N...HWC` and have 4 (or 5 in case of demultiplexing) shape dimensions. It means that input layout needs to resemble `NHWC` layout, e.g. default `N...` will work. On the other hand, binary image input is not supported for inputs with `NCHW` layout.
23+
24+
To fully utilize binary input utility, automatic image size alignment will be done by OVMS when:
25+
- input shape does not include dynamic dimension value (`-1`)
26+
- input layout is configured to be either `...` (custom nodes) or `NHWC` (or `N?HWC`, when modified by a [demultiplexer](demultiplexing.md))
27+
28+
Processing the binary image requests requires the model or the custom nodes to accept BGR color
2329
format with the data range from 0-255. Original layout of the input data can be changed in the
2430
OVMS configuration at runtime. For example, when the original model has input shape [1,3,224,224] add a parameter
2531
in the OVMS configuration "layout": "NHWC:NCHW" or the command line parameter `--layout NHWC:NCHW`. In result, the model will
26-
have effective shape [1,224,224,3].
32+
have effective shape [1,224,224,3] and layout `NHWC`.
2733

2834
In case the model was trained with color format RGB and a range other than 0-255, the
2935
[model optimizer](tf_model_binary_input.md)

src/binaryutils.cpp

+111-81
Original file line numberDiff line numberDiff line change
@@ -72,7 +72,7 @@ cv::Mat convertStringValToMat(const std::string& stringVal) {
7272
try {
7373
return cv::imdecode(dataMat, cv::IMREAD_UNCHANGED);
7474
} catch (const cv::Exception& e) {
75-
SPDLOG_ERROR("Error during string_val to mat conversion: {}", e.what());
75+
SPDLOG_DEBUG("Error during string_val to mat conversion: {}", e.what());
7676
return cv::Mat{};
7777
}
7878
}
@@ -89,79 +89,25 @@ Status convertPrecision(const cv::Mat& src, cv::Mat& dst, const ovms::Precision
8989
}
9090

9191
Status validateLayout(const std::shared_ptr<TensorInfo>& tensorInfo) {
92-
if ((tensorInfo->getLayout() != "NHWC") &&
93-
(tensorInfo->getLayout() != Layout::getUnspecifiedLayout()) && // handle DAG
94-
(tensorInfo->getLayout() != Layout::getDefaultLayout())) { // handle model without Layout set
92+
static const std::string binarySupportedLayout = "N...HWC";
93+
if (!tensorInfo->getLayout().createIntersection(Layout(binarySupportedLayout), tensorInfo->getShape().size()).has_value()) {
94+
SPDLOG_DEBUG("Endpoint needs to be compatible with {} to support binary image inputs, actual: {}",
95+
binarySupportedLayout,
96+
tensorInfo->getLayout());
9597
return StatusCode::UNSUPPORTED_LAYOUT;
9698
}
9799
return StatusCode::OK;
98100
}
99101

100-
bool resizeNeeded(const cv::Mat& image, const std::shared_ptr<TensorInfo>& tensorInfo) {
101-
Dimension cols = Dimension::any();
102-
Dimension rows = Dimension::any();
103-
if (tensorInfo->getShape().size() == 4) {
104-
cols = tensorInfo->getShape()[2];
105-
rows = tensorInfo->getShape()[1];
106-
} else if (tensorInfo->isInfluencedByDemultiplexer() && tensorInfo->getShape().size() == 5) {
107-
cols = tensorInfo->getShape()[3];
108-
rows = tensorInfo->getShape()[2];
109-
} else {
110-
return false;
111-
}
112-
if (cols.isAny()) {
113-
cols = image.cols;
114-
}
115-
if (rows.isAny()) {
116-
rows = image.rows;
117-
}
118-
if ((!cols.match(image.cols)) || (!rows.match(image.rows))) {
102+
bool resizeNeeded(const cv::Mat& image, const dimension_value_t height, const dimension_value_t width) {
103+
if (height != image.rows || width != image.cols) {
119104
return true;
120105
}
121106
return false;
122107
}
123108

124-
Status resizeMat(const cv::Mat& src, cv::Mat& dst, const std::shared_ptr<TensorInfo>& tensorInfo) {
125-
Dimension cols = Dimension::any();
126-
Dimension rows = Dimension::any();
127-
if (tensorInfo->getShape().size() == 4) {
128-
cols = tensorInfo->getShape()[2];
129-
rows = tensorInfo->getShape()[1];
130-
} else if (tensorInfo->isInfluencedByDemultiplexer() && tensorInfo->getShape().size() == 5) {
131-
cols = tensorInfo->getShape()[3];
132-
rows = tensorInfo->getShape()[2];
133-
} else {
134-
return StatusCode::UNSUPPORTED_LAYOUT;
135-
}
136-
if (cols.isAny()) {
137-
cols = src.cols;
138-
}
139-
if (rows.isAny()) {
140-
rows = src.rows;
141-
}
142-
if (cols.isDynamic()) {
143-
dimension_value_t value = src.cols;
144-
if (src.cols < cols.getMinValue())
145-
value = cols.getMinValue();
146-
147-
if (src.cols > cols.getMaxValue())
148-
value = cols.getMaxValue();
149-
150-
if (value != src.cols)
151-
cols = Dimension(value);
152-
}
153-
if (rows.isDynamic()) {
154-
dimension_value_t value = src.rows;
155-
if (src.rows < rows.getMinValue())
156-
value = rows.getMinValue();
157-
158-
if (src.rows > rows.getMaxValue())
159-
value = rows.getMaxValue();
160-
161-
if (value != src.rows)
162-
rows = Dimension(value);
163-
}
164-
cv::resize(src, dst, cv::Size(cols.getStaticValue(), rows.getStaticValue()));
109+
Status resizeMat(const cv::Mat& src, cv::Mat& dst, const dimension_value_t height, const dimension_value_t width) {
110+
cv::resize(src, dst, cv::Size(width, height));
165111
return StatusCode::OK;
166112
}
167113

@@ -199,7 +145,7 @@ Status validateResolutionAgainstFirstBatchImage(const cv::Mat input, cv::Mat* fi
199145
if (input.cols == firstBatchImage->cols && input.rows == firstBatchImage->rows) {
200146
return StatusCode::OK;
201147
}
202-
SPDLOG_ERROR("Each binary image in request needs to have resolution matched. First cols: {}, rows: {}, current cols: {}, rows: {}",
148+
SPDLOG_DEBUG("Each binary image in request needs to have resolution matched. First cols: {}, rows: {}, current cols: {}, rows: {}",
203149
firstBatchImage->cols, firstBatchImage->rows, input.cols, input.rows);
204150
return StatusCode::BINARY_IMAGES_RESOLUTION_MISMATCH;
205151
}
@@ -212,14 +158,13 @@ bool checkBatchSizeMismatch(const std::shared_ptr<TensorInfo>& tensorInfo,
212158
return !tensorInfo->getBatchSize().value().match(batchSize);
213159
}
214160

215-
Status validateInput(const std::shared_ptr<TensorInfo>& tensorInfo, const cv::Mat input, cv::Mat* firstBatchImage) {
216-
// For pipelines with only custom nodes entry, or models with default layout there is no way to deduce layout.
217-
// With unknown layout, there is no way to deduce pipeline input resolution.
218-
// This forces binary utility to create tensors with resolution inherited from input binary image from request.
219-
// To achieve it, in this specific case we require all binary images to have the same resolution.
220-
// TODO check if H/W is undefined and only then check this CVS-77193
221-
if (firstBatchImage &&
222-
(tensorInfo->getLayout() == Layout::getUnspecifiedLayout())) {
161+
Status validateInput(const std::shared_ptr<TensorInfo>& tensorInfo, const cv::Mat input, cv::Mat* firstBatchImage, bool enforceResolutionAlignment) {
162+
// Binary inputs are supported for any endpoint that is compatible with N...HWC layout.
163+
// With unknown layout, there is no way to deduce expected endpoint input resolution.
164+
// This forces binary utility to create tensors with resolution inherited from first batch of binary input image (request).
165+
// In case of any dimension in endpoint shape is dynamic, we need to validate images against first image resolution.
166+
// Otherwise we can omit that, and proceed to image resize.
167+
if (firstBatchImage && enforceResolutionAlignment) {
223168
auto status = validateResolutionAgainstFirstBatchImage(input, firstBatchImage);
224169
if (!status.ok()) {
225170
return status;
@@ -258,17 +203,90 @@ Status validateTensor(const std::shared_ptr<TensorInfo>& tensorInfo,
258203
return StatusCode::OK;
259204
}
260205

206+
Dimension getTensorInfoHeightDim(const std::shared_ptr<TensorInfo>& tensorInfo) {
207+
size_t numberOfShapeDimensions = tensorInfo->getShape().size();
208+
if (numberOfShapeDimensions < 4 || numberOfShapeDimensions > 5) {
209+
throw std::logic_error("wrong number of shape dimensions");
210+
}
211+
size_t position = numberOfShapeDimensions == 4 ? /*NHWC*/ 1 : /*N?HWC*/ 2;
212+
return tensorInfo->getShape()[position];
213+
}
214+
215+
Dimension getTensorInfoWidthDim(const std::shared_ptr<TensorInfo>& tensorInfo) {
216+
size_t numberOfShapeDimensions = tensorInfo->getShape().size();
217+
if (numberOfShapeDimensions < 4 || numberOfShapeDimensions > 5) {
218+
throw std::logic_error("wrong number of shape dimensions");
219+
}
220+
size_t position = numberOfShapeDimensions == 4 ? /*NHWC*/ 2 : /*N?HWC*/ 3;
221+
return tensorInfo->getShape()[position];
222+
}
223+
224+
void updateTargetResolution(Dimension& height, Dimension& width, const cv::Mat& image) {
225+
if (height.isAny()) {
226+
height = image.rows;
227+
} else if (height.isDynamic()) {
228+
if (height.match(image.rows)) {
229+
height = image.rows;
230+
} else {
231+
if (image.rows > height.getMaxValue()) {
232+
height = height.getMaxValue();
233+
} else {
234+
height = height.getMinValue();
235+
}
236+
}
237+
}
238+
if (width.isAny()) {
239+
width = image.cols;
240+
} else if (width.isDynamic()) {
241+
if (width.match(image.cols)) {
242+
width = image.cols;
243+
} else {
244+
if (image.cols > width.getMaxValue()) {
245+
width = width.getMaxValue();
246+
} else {
247+
width = width.getMinValue();
248+
}
249+
}
250+
}
251+
}
252+
253+
bool isResizeSupported(const std::shared_ptr<TensorInfo>& tensorInfo) {
254+
for (const auto& dim : tensorInfo->getShape()) {
255+
if (dim.isAny()) {
256+
return false;
257+
}
258+
}
259+
if (tensorInfo->getLayout() != "NHWC" &&
260+
tensorInfo->getLayout() != "N?HWC" &&
261+
tensorInfo->getLayout() != Layout::getUnspecifiedLayout()) {
262+
return false;
263+
}
264+
return true;
265+
}
266+
261267
Status convertTensorToMatsMatchingTensorInfo(const tensorflow::TensorProto& src, std::vector<cv::Mat>& images, const std::shared_ptr<TensorInfo>& tensorInfo) {
268+
Dimension targetHeight = getTensorInfoHeightDim(tensorInfo);
269+
Dimension targetWidth = getTensorInfoWidthDim(tensorInfo);
270+
271+
// Enforce resolution alignment against first image in the batch if resize is not supported.
272+
bool resizeSupported = isResizeSupported(tensorInfo);
273+
bool enforceResolutionAlignment = !resizeSupported;
274+
262275
for (int i = 0; i < src.string_val_size(); i++) {
263276
cv::Mat image = convertStringValToMat(src.string_val(i));
264277
if (image.data == nullptr)
265278
return StatusCode::IMAGE_PARSING_FAILED;
266279

267280
cv::Mat* firstImage = images.size() == 0 ? nullptr : &images.at(0);
268-
auto status = validateInput(tensorInfo, image, firstImage);
281+
auto status = validateInput(tensorInfo, image, firstImage, enforceResolutionAlignment);
269282
if (status != StatusCode::OK) {
270283
return status;
271284
}
285+
286+
if (i == 0) {
287+
updateTargetResolution(targetHeight, targetWidth, image);
288+
}
289+
272290
if (!isPrecisionEqual(image.depth(), tensorInfo->getPrecision())) {
273291
cv::Mat imageCorrectPrecision;
274292
status = convertPrecision(image, imageCorrectPrecision, tensorInfo->getPrecision());
@@ -278,14 +296,26 @@ Status convertTensorToMatsMatchingTensorInfo(const tensorflow::TensorProto& src,
278296
}
279297
image = std::move(imageCorrectPrecision);
280298
}
281-
if (resizeNeeded(image, tensorInfo)) {
299+
if (!targetHeight.isStatic() || !targetWidth.isStatic()) {
300+
return StatusCode::INTERNAL_ERROR;
301+
}
302+
if (resizeNeeded(image, targetHeight.getStaticValue(), targetWidth.getStaticValue())) {
303+
if (!resizeSupported) {
304+
return StatusCode::INVALID_SHAPE;
305+
}
282306
cv::Mat imageResized;
283-
status = resizeMat(image, imageResized, tensorInfo);
307+
status = resizeMat(image, imageResized, targetHeight.getStaticValue(), targetWidth.getStaticValue());
284308
if (!status.ok()) {
285309
return status;
286310
}
287311
image = std::move(imageResized);
288312
}
313+
314+
if (i == 0 && src.string_val_size() > 1) {
315+
// TODO: CVS-78796 Check if the total bytes for tensor will not exceed 1GB.
316+
// Multiply src.string_val_size() * image resolution * precision size
317+
}
318+
289319
images.push_back(image);
290320
}
291321

@@ -304,7 +334,7 @@ shape_t getShapeFromImages(const std::vector<cv::Mat>& images, const std::shared
304334
return dims;
305335
}
306336

307-
ov::Tensor createTensorFromMats(const std::vector<cv::Mat>& images, const std::shared_ptr<TensorInfo>& tensorInfo, bool isPipeline) {
337+
ov::Tensor createTensorFromMats(const std::vector<cv::Mat>& images, const std::shared_ptr<TensorInfo>& tensorInfo) {
308338
ov::Shape shape = getShapeFromImages(images, tensorInfo);
309339
ov::element::Type precision = tensorInfo->getOvPrecision();
310340
ov::Tensor tensor(precision, shape);
@@ -316,7 +346,7 @@ ov::Tensor createTensorFromMats(const std::vector<cv::Mat>& images, const std::s
316346
return tensor;
317347
}
318348

319-
ov::Tensor convertMatsToTensor(std::vector<cv::Mat>& images, const std::shared_ptr<TensorInfo>& tensorInfo, bool isPipeline) {
349+
ov::Tensor convertMatsToTensor(std::vector<cv::Mat>& images, const std::shared_ptr<TensorInfo>& tensorInfo) {
320350
switch (tensorInfo->getPrecision()) {
321351
case ovms::Precision::FP32:
322352
case ovms::Precision::I32:
@@ -326,7 +356,7 @@ ov::Tensor convertMatsToTensor(std::vector<cv::Mat>& images, const std::shared_p
326356
case ovms::Precision::FP16:
327357
case ovms::Precision::U16:
328358
case ovms::Precision::I16:
329-
return createTensorFromMats(images, tensorInfo, isPipeline);
359+
return createTensorFromMats(images, tensorInfo);
330360
case ovms::Precision::MIXED:
331361
case ovms::Precision::Q78:
332362
case ovms::Precision::BIN:
@@ -337,7 +367,7 @@ ov::Tensor convertMatsToTensor(std::vector<cv::Mat>& images, const std::shared_p
337367
}
338368
}
339369

340-
Status convertStringValToTensor(const tensorflow::TensorProto& src, ov::Tensor& tensor, const std::shared_ptr<TensorInfo>& tensorInfo, bool isPipeline) {
370+
Status convertStringValToTensor(const tensorflow::TensorProto& src, ov::Tensor& tensor, const std::shared_ptr<TensorInfo>& tensorInfo) {
341371
auto status = validateTensor(tensorInfo, src);
342372
if (status != StatusCode::OK) {
343373
return status;
@@ -350,7 +380,7 @@ Status convertStringValToTensor(const tensorflow::TensorProto& src, ov::Tensor&
350380
return status;
351381
}
352382

353-
tensor = convertMatsToTensor(images, tensorInfo, isPipeline);
383+
tensor = convertMatsToTensor(images, tensorInfo);
354384
if (!tensor) {
355385
return StatusCode::IMAGE_PARSING_FAILED;
356386
}

src/binaryutils.hpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -21,5 +21,5 @@
2121
#include "tensorinfo.hpp"
2222

2323
namespace ovms {
24-
Status convertStringValToTensor(const tensorflow::TensorProto& src, ov::Tensor& tensor, const std::shared_ptr<TensorInfo>& tensorInfo, bool isPipeline);
24+
Status convertStringValToTensor(const tensorflow::TensorProto& src, ov::Tensor& tensor, const std::shared_ptr<TensorInfo>& tensorInfo);
2525
} // namespace ovms

src/deserialization.hpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -124,7 +124,7 @@ Status deserializePredictRequest(
124124

125125
if (requestInput.dtype() == tensorflow::DataType::DT_STRING) {
126126
SPDLOG_DEBUG("Request contains binary input: {}", name);
127-
status = convertStringValToTensor(requestInput, tensor, tensorInfo, isPipeline);
127+
status = convertStringValToTensor(requestInput, tensor, tensorInfo);
128128
if (!status.ok()) {
129129
SPDLOG_DEBUG("Binary inputs conversion failed.");
130130
return status;

0 commit comments

Comments
 (0)