#include "ANSONNXPOSE.h" #include "EPLoader.h" namespace ANSCENTER { std::atomic ANSONNXPOSE::instanceCounter_(0); // Initialize static member size_t ANSONNXPOSE::vectorProduct(const std::vector& vector) { return std::accumulate(vector.begin(), vector.end(), 1ull, std::multiplies()); } void ANSONNXPOSE::letterBox(const cv::Mat& image, cv::Mat& outImage, const cv::Size& newShape, const cv::Scalar& color, bool auto_, bool scaleFill, bool scaleUp, int stride) { // Calculate the scaling ratio to fit the image within the new shape float ratio = std::min(static_cast(newShape.height) / image.rows, static_cast(newShape.width) / image.cols); // Prevent scaling up if not allowed if (!scaleUp) { ratio = std::min(ratio, 1.0f); } // Calculate new dimensions after scaling int newUnpadW = static_cast(std::round(image.cols * ratio)); int newUnpadH = static_cast(std::round(image.rows * ratio)); // Calculate padding needed to reach the desired shape int dw = newShape.width - newUnpadW; int dh = newShape.height - newUnpadH; if (auto_) { // Ensure padding is a multiple of stride for model compatibility dw = (dw % stride) / 2; dh = (dh % stride) / 2; } else if (scaleFill) { // Scale to fill without maintaining aspect ratio newUnpadW = newShape.width; newUnpadH = newShape.height; ratio = std::min(static_cast(newShape.width) / image.cols, static_cast(newShape.height) / image.rows); dw = 0; dh = 0; } else { // Evenly distribute padding on both sides // Calculate separate padding for left/right and top/bottom to handle odd padding int padLeft = dw / 2; int padRight = dw - padLeft; int padTop = dh / 2; int padBottom = dh - padTop; // Resize the image if the new dimensions differ if (image.cols != newUnpadW || image.rows != newUnpadH) { cv::resize(image, outImage, cv::Size(newUnpadW, newUnpadH), 0, 0, cv::INTER_LINEAR); } else { // Avoid unnecessary copying if dimensions are the same outImage = image; } // Apply padding to reach the desired shape cv::copyMakeBorder(outImage, outImage, 
padTop, padBottom, padLeft, padRight, cv::BORDER_CONSTANT, color); return; // Exit early since padding is already applied } // Resize the image if the new dimensions differ if (image.cols != newUnpadW || image.rows != newUnpadH) { cv::resize(image, outImage, cv::Size(newUnpadW, newUnpadH), 0, 0, cv::INTER_LINEAR); } else { // Avoid unnecessary copying if dimensions are the same outImage = image; } // Calculate separate padding for left/right and top/bottom to handle odd padding int padLeft = dw / 2; int padRight = dw - padLeft; int padTop = dh / 2; int padBottom = dh - padTop; // Apply padding to reach the desired shape cv::copyMakeBorder(outImage, outImage, padTop, padBottom, padLeft, padRight, cv::BORDER_CONSTANT, color); } void ANSONNXPOSE::NMSBoxes(const std::vector& boundingBoxes, const std::vector& scores, float scoreThreshold, float nmsThreshold, std::vector& indices) { indices.clear(); const size_t numBoxes = boundingBoxes.size(); if (numBoxes == 0) { DEBUG_PRINT("No bounding boxes to process in NMS"); return; } // Step 1: Filter out boxes with scores below the threshold // and create a list of indices sorted by descending scores std::vector sortedIndices; sortedIndices.reserve(numBoxes); for (size_t i = 0; i < numBoxes; ++i) { if (scores[i] >= scoreThreshold) { sortedIndices.push_back(static_cast(i)); } } // If no boxes remain after thresholding if (sortedIndices.empty()) { DEBUG_PRINT("No bounding boxes above score threshold"); return; } // Sort the indices based on scores in descending order std::sort(sortedIndices.begin(), sortedIndices.end(), [&scores](int idx1, int idx2) { return scores[idx1] > scores[idx2]; }); // Step 2: Precompute the areas of all boxes std::vector areas(numBoxes, 0.0f); for (size_t i = 0; i < numBoxes; ++i) { areas[i] = boundingBoxes[i].width * boundingBoxes[i].height; } // Step 3: Suppression mask to mark boxes that are suppressed std::vector suppressed(numBoxes, false); // Step 4: Iterate through the sorted list and suppress 
boxes with high IoU for (size_t i = 0; i < sortedIndices.size(); ++i) { int currentIdx = sortedIndices[i]; if (suppressed[currentIdx]) { continue; } // Select the current box as a valid detection indices.push_back(currentIdx); const BoundingBox& currentBox = boundingBoxes[currentIdx]; const float x1_max = currentBox.x; const float y1_max = currentBox.y; const float x2_max = currentBox.x + currentBox.width; const float y2_max = currentBox.y + currentBox.height; const float area_current = areas[currentIdx]; // Compare IoU of the current box with the rest for (size_t j = i + 1; j < sortedIndices.size(); ++j) { int compareIdx = sortedIndices[j]; if (suppressed[compareIdx]) { continue; } const BoundingBox& compareBox = boundingBoxes[compareIdx]; const float x1 = std::max(x1_max, static_cast(compareBox.x)); const float y1 = std::max(y1_max, static_cast(compareBox.y)); const float x2 = std::min(x2_max, static_cast(compareBox.x + compareBox.width)); const float y2 = std::min(y2_max, static_cast(compareBox.y + compareBox.height)); const float interWidth = x2 - x1; const float interHeight = y2 - y1; if (interWidth <= 0 || interHeight <= 0) { continue; } const float intersection = interWidth * interHeight; const float unionArea = area_current + areas[compareIdx] - intersection; const float iou = (unionArea > 0.0f) ? 
(intersection / unionArea) : 0.0f; if (iou > nmsThreshold) { suppressed[compareIdx] = true; } } } DEBUG_PRINT("NMS completed with " + std::to_string(indices.size()) + " indices remaining"); } void ANSONNXPOSE::drawPoseEstimation(cv::Mat& image, const std::vector& detections, float confidenceThreshold, float kptThreshold) { // Calculate dynamic sizes based on image dimensions const int min_dim = std::min(image.rows, image.cols); const float scale_factor = min_dim / 1280.0f; // Reference 1280px size // Dynamic sizing parameters const int line_thickness = std::max(1, static_cast(2 * scale_factor)); const int kpt_radius = std::max(2, static_cast(4 * scale_factor)); const float font_scale = 0.5f * scale_factor; const int text_thickness = std::max(1, static_cast(1 * scale_factor)); const int text_offset = static_cast(10 * scale_factor); static const std::vector pose_palette = { cv::Scalar(0,128,255), // 0 cv::Scalar(51,153,255), // 1 cv::Scalar(102,178,255), // 2 cv::Scalar(0,230,230), // 3 cv::Scalar(255,153,255), // 4 cv::Scalar(255,204,153), // 5 cv::Scalar(255,102,255), // 6 cv::Scalar(255,51,255), // 7 cv::Scalar(255,178,102), // 8 cv::Scalar(255,153,51), // 9 cv::Scalar(153,153,255), // 10 cv::Scalar(102,102,255), // 11 cv::Scalar(51,51,255), // 12 cv::Scalar(153,255,153), // 13 cv::Scalar(102,255,102), // 14 cv::Scalar(51,255,51), // 15 cv::Scalar(0,255,0), // 16 cv::Scalar(255,0,0), // 17 cv::Scalar(0,0,255), // 18 cv::Scalar(255,255,255) // 19 }; // Define per-keypoint color indices (for keypoints 0 to 16) static const std::vector kpt_color_indices = { 16,16,16,16,16,0,0,0,0,0,0,9,9,9,9,9,9 }; // Define per-limb color indices for each skeleton connection. // Make sure the number of entries here matches the number of pairs in POSE_SKELETON. 
static const std::vector limb_color_indices = { 9,9,9,9,7,7,7,0,0,0,0,0,16,16,16,16,16,16,16 }; // Loop through each detection for (const auto& detection : detections) { if (detection.confidence < confidenceThreshold) continue; // Draw bounding box (optional – remove if you prefer only pose visualization) const auto& box = detection.box; cv::rectangle(image, cv::Point(box.x, box.y), cv::Point(box.x + box.width, box.y + box.height), cv::Scalar(0, 255, 0), // You can change the box color if desired line_thickness); // Prepare a vector to hold keypoint positions and validity flags. const size_t numKpts = detection.kps.size(); std::vector kpt_points(numKpts, cv::Point(-1, -1)); std::vector valid(numKpts, false); // Draw keypoints using the corresponding palette colors for (size_t i = 0; i < numKpts; i++) { int x = std::round(detection.polygon[i].x); int y = std::round(detection.polygon[i].y); kpt_points[i] = cv::Point(x, y); valid[i] = true; int color_index = (i < kpt_color_indices.size()) ? kpt_color_indices[i] : 0; cv::circle(image, cv::Point(x, y), kpt_radius, pose_palette[color_index], -1, cv::LINE_AA); } // Draw skeleton connections based on a predefined POSE_SKELETON (vector of pairs) // Make sure that POSE_SKELETON is defined with 0-indexed keypoint indices. for (size_t j = 0; j < POSE_SKELETON.size(); j++) { auto [src, dst] = POSE_SKELETON[j]; if (src < numKpts && dst < numKpts && valid[src] && valid[dst]) { // Use the corresponding limb color from the palette int limb_color_index = (j < limb_color_indices.size()) ? limb_color_indices[j] : 0; cv::line(image, kpt_points[src], kpt_points[dst], pose_palette[limb_color_index], line_thickness, cv::LINE_AA); } } // (Optional) Add text labels such as confidence scores here if desired. 
} } bool ANSONNXPOSE::Init(const std::string& modelPath, bool useGPU, int deviceId) { std::lock_guard lock(_mutex); try { deviceId_ = deviceId; const auto& ep = ANSCENTER::EPLoader::Current(); if (Ort::Global::api_ == nullptr) Ort::InitApi(static_cast(EPLoader::GetOrtApiRaw())); std::cout << "[ANSONNXPOSE] EP ready: " << ANSCENTER::EPLoader::EngineTypeName(ep.type) << std::endl; // Unique environment name per instance to avoid conflicts std::string envName = "ONNX_POSE_INST" + std::to_string(instanceId_); env = Ort::Env(ORT_LOGGING_LEVEL_WARNING, envName.c_str()); sessionOptions = Ort::SessionOptions(); sessionOptions.SetIntraOpNumThreads( std::min(6, static_cast(std::thread::hardware_concurrency()))); sessionOptions.SetGraphOptimizationLevel(GraphOptimizationLevel::ORT_ENABLE_ALL); // ── Log available providers ───────────────────────────────────────── std::vector availableProviders = Ort::GetAvailableProviders(); std::cout << "[Instance " << instanceId_ << "] Available Execution Providers:" << std::endl; for (const auto& p : availableProviders) std::cout << " - " << p << std::endl; // ── Attach EP based on runtime-detected hardware ──────────────────── if (useGPU) { bool attached = false; switch (ep.type) { case ANSCENTER::EngineType::NVIDIA_GPU: { auto it = std::find(availableProviders.begin(), availableProviders.end(), "CUDAExecutionProvider"); if (it == availableProviders.end()) { this->_logger.LogError("ANSONNXPOSE::Init", "CUDAExecutionProvider not in DLL — " "check ep/cuda/ has the CUDA ORT build.", __FILE__, __LINE__); break; } try { OrtCUDAProviderOptionsV2* cuda_options = nullptr; Ort::GetApi().CreateCUDAProviderOptions(&cuda_options); std::string deviceIdStr = std::to_string(deviceId_); const char* keys[] = { "device_id" }; const char* values[] = { deviceIdStr.c_str() }; Ort::GetApi().UpdateCUDAProviderOptions(cuda_options, keys, values, 1); sessionOptions.AppendExecutionProvider_CUDA_V2(*cuda_options); 
Ort::GetApi().ReleaseCUDAProviderOptions(cuda_options); std::cout << "[Instance " << instanceId_ << "] CUDA EP attached on device " << deviceId_ << "." << std::endl; attached = true; } catch (const Ort::Exception& e) { this->_logger.LogError("ANSONNXPOSE::Init", e.what(), __FILE__, __LINE__); } break; } case ANSCENTER::EngineType::AMD_GPU: { auto it = std::find(availableProviders.begin(), availableProviders.end(), "DmlExecutionProvider"); if (it == availableProviders.end()) { this->_logger.LogError("ANSONNXPOSE::Init", "DmlExecutionProvider not in DLL — " "check ep/directml/ has the DirectML ORT build.", __FILE__, __LINE__); break; } try { std::unordered_map opts = { { "device_id", std::to_string(deviceId_) } }; sessionOptions.AppendExecutionProvider("DML", opts); std::cout << "[Instance " << instanceId_ << "] DirectML EP attached on device " << deviceId_ << "." << std::endl; attached = true; } catch (const Ort::Exception& e) { this->_logger.LogError("ANSONNXPOSE::Init", e.what(), __FILE__, __LINE__); } break; } case ANSCENTER::EngineType::OPENVINO_GPU: { auto it = std::find(availableProviders.begin(), availableProviders.end(), "OpenVINOExecutionProvider"); if (it == availableProviders.end()) { this->_logger.LogError("ANSONNXPOSE::Init", "OpenVINOExecutionProvider not in DLL — " "check ep/openvino/ has the OpenVINO ORT build.", __FILE__, __LINE__); break; } // FP32 + single thread preserved for determinism; each instance gets its own stream and cache const std::string precision = "FP32"; const std::string numberOfThreads = "1"; const std::string numberOfStreams = std::to_string(instanceId_ + 1); const std::string primaryDevice = "GPU." 
+ std::to_string(deviceId_); const std::string cacheDir = "./ov_cache_inst" + std::to_string(instanceId_); std::vector> try_configs = { { {"device_type", primaryDevice}, {"precision",precision}, {"num_of_threads",numberOfThreads}, {"num_streams",numberOfStreams}, {"enable_opencl_throttling","False"}, {"enable_qdq_optimizer","False"}, {"cache_dir", cacheDir} }, { {"device_type","GPU"}, {"precision",precision}, {"num_of_threads",numberOfThreads}, {"num_streams",numberOfStreams}, {"enable_opencl_throttling","False"}, {"enable_qdq_optimizer","False"}, {"cache_dir", cacheDir} }, { {"device_type","AUTO:GPU,CPU"}, {"precision",precision}, {"num_of_threads",numberOfThreads}, {"num_streams",numberOfStreams}, {"enable_opencl_throttling","False"}, {"enable_qdq_optimizer","False"}, {"cache_dir", cacheDir} } }; for (const auto& config : try_configs) { try { sessionOptions.AppendExecutionProvider_OpenVINO_V2(config); std::cout << "[Instance " << instanceId_ << "] OpenVINO EP attached (" << config.at("device_type") << ", stream: " << numberOfStreams << ")." << std::endl; attached = true; break; } catch (const Ort::Exception& e) { this->_logger.LogError("ANSONNXPOSE::Init", e.what(), __FILE__, __LINE__); } } if (!attached) std::cerr << "[Instance " << instanceId_ << "] OpenVINO EP: all device configs failed." << std::endl; break; } default: break; } if (!attached) { std::cerr << "[Instance " << instanceId_ << "] No GPU EP attached — running on CPU." << std::endl; this->_logger.LogFatal("ANSONNXPOSE::Init", "GPU EP not attached. 
Running on CPU.", __FILE__, __LINE__); } } else { std::cout << "[Instance " << instanceId_ << "] Inference device: CPU (useGPU=false)" << std::endl; } // ── Load model ────────────────────────────────────────────────────── #ifdef _WIN32 std::wstring w_modelPath = std::wstring(modelPath.begin(), modelPath.end()); session = Ort::Session(env, w_modelPath.c_str(), sessionOptions); #else session = Ort::Session(env, modelPath.c_str(), sessionOptions); #endif Ort::AllocatorWithDefaultOptions allocator; numInputNodes = session.GetInputCount(); numOutputNodes = session.GetOutputCount(); if (numInputNodes == 0) throw std::runtime_error("Model has no input nodes."); if (numOutputNodes == 0) throw std::runtime_error("Model has no output nodes."); // ── Input shape ───────────────────────────────────────────────────── Ort::TypeInfo inputTypeInfo = session.GetInputTypeInfo(0); std::vector inputTensorShapeVec = inputTypeInfo.GetTensorTypeAndShapeInfo().GetShape(); if (inputTensorShapeVec.size() < 4) throw std::runtime_error("Invalid input tensor shape - expected 4 dimensions (NCHW)."); isDynamicInputShape = (inputTensorShapeVec[2] == -1 || inputTensorShapeVec[3] == -1); std::cout << "[Instance " << instanceId_ << "] Model input shape: [" << inputTensorShapeVec[0] << ", " << inputTensorShapeVec[1] << ", " << inputTensorShapeVec[2] << ", " << inputTensorShapeVec[3] << "]" << (isDynamicInputShape ? 
" (dynamic)" : " (fixed)") << std::endl; if (!isDynamicInputShape) { inputImageShape = cv::Size( static_cast(inputTensorShapeVec[3]), static_cast(inputTensorShapeVec[2])); } else { inputImageShape = cv::Size(_modelConfig.inpWidth, _modelConfig.inpHeight); std::cout << "[Instance " << instanceId_ << "] Using default input shape: " << inputImageShape.width << "x" << inputImageShape.height << std::endl; } // ── Node names ────────────────────────────────────────────────────── auto input_name = session.GetInputNameAllocated(0, allocator); inputNodeNameAllocatedStrings.push_back(std::move(input_name)); inputNames.push_back(inputNodeNameAllocatedStrings.back().get()); for (size_t i = 0; i < numOutputNodes; ++i) { auto output_name = session.GetOutputNameAllocated(i, allocator); outputNodeNameAllocatedStrings.push_back(std::move(output_name)); outputNames.push_back(outputNodeNameAllocatedStrings.back().get()); } std::cout << "[Instance " << instanceId_ << "] Model loaded successfully:" << std::endl; std::cout << " - Input nodes: " << numInputNodes << std::endl; std::cout << " - Output nodes: " << numOutputNodes << std::endl; std::cout << " - Input shape: " << inputImageShape.width << "x" << inputImageShape.height << std::endl; // ── Warmup ────────────────────────────────────────────────────────── DEBUG_PRINT("[Instance " << instanceId_ << "] Starting warmup..."); warmupModel(); DEBUG_PRINT("[Instance " << instanceId_ << "] Warmup completed successfully."); return true; } catch (const std::exception& e) { this->_logger.LogFatal("ANSONNXPOSE::Init", std::string("[Instance ") + std::to_string(instanceId_) + "] " + e.what(), __FILE__, __LINE__); return false; } } void ANSONNXPOSE::warmupModel() { try { // Create dummy input image with correct size cv::Mat dummyImage = cv::Mat::zeros(inputImageShape.height, inputImageShape.width, CV_8UC3); DEBUG_PRINT("[Instance " << instanceId_ << "] Warmup: dummy image " << dummyImage.cols << "x" << dummyImage.rows); // Run 3 warmup 
inferences to stabilize for (int i = 0; i < 3; ++i) { try { // Your preprocessing logic here float* blob = nullptr; std::vector inputShape; // If you have a preprocess method, call it // Otherwise, create a simple dummy tensor size_t tensorSize = 1 * 3 * inputImageShape.height * inputImageShape.width; blob = new float[tensorSize]; std::memset(blob, 0, tensorSize * sizeof(float)); inputShape = { 1, 3, inputImageShape.height, inputImageShape.width }; // Create input tensor Ort::MemoryInfo memoryInfo = Ort::MemoryInfo::CreateCpu(OrtArenaAllocator, OrtMemTypeDefault); Ort::Value inputTensor = Ort::Value::CreateTensor( memoryInfo, blob, tensorSize, inputShape.data(), inputShape.size() ); // Run inference std::vector outputTensors = session.Run( Ort::RunOptions{ nullptr }, inputNames.data(), &inputTensor, 1, outputNames.data(), numOutputNodes ); // Clean up delete[] blob; DEBUG_PRINT("[Instance " << instanceId_ << "] Warmup " << (i + 1) << "/3 completed"); } catch (const std::exception& e) { DEBUG_PRINT("[Instance " << instanceId_ << "] Warmup iteration " << i << " failed (non-critical): " << e.what()); } } DEBUG_PRINT("[Instance " << instanceId_ << "] Warmup successful - all states initialized"); } catch (const std::exception& e) { this->_logger.LogWarn("ANSONNXPOSE::warmupModel", std::string("[Instance ") + std::to_string(instanceId_) + "] Warmup failed: " + e.what(), __FILE__, __LINE__); } } cv::Mat ANSONNXPOSE::preprocess(const cv::Mat& image, float*& blob, std::vector& inputTensorShape) { std::lock_guard lock(_mutex); try { // CRITICAL: Validate input image if (image.empty()) { this->_logger.LogError("ANSONNXPOSE::preprocess", "Input image is empty", __FILE__, __LINE__); return cv::Mat(); } if (image.data == nullptr) { this->_logger.LogError("ANSONNXPOSE::preprocess", "Input image data pointer is null", __FILE__, __LINE__); return cv::Mat(); } if (image.cols <= 0 || image.rows <= 0) { this->_logger.LogError("ANSONNXPOSE::preprocess", "Invalid image dimensions: " + 
std::to_string(image.cols) + "x" + std::to_string(image.rows), __FILE__, __LINE__); return cv::Mat(); } // CRITICAL: Check for NaN/Inf in input double minVal, maxVal; cv::minMaxLoc(image, &minVal, &maxVal); if (std::isnan(minVal) || std::isnan(maxVal) || std::isinf(minVal) || std::isinf(maxVal)) { this->_logger.LogError("ANSONNXPOSE::preprocess", "Input image contains NaN or Inf values. Min: " + std::to_string(minVal) + ", Max: " + std::to_string(maxVal), __FILE__, __LINE__); return cv::Mat(); } DEBUG_PRINT("[Instance " << instanceId_ << "] Input image: " << image.cols << "x" << image.rows << ", channels: " << image.channels() << ", type: " << image.type() << ", pixel range: [" << minVal << ", " << maxVal << "]"); // CRITICAL: Clean up existing blob first to prevent memory leak if (blob != nullptr) { delete[] blob; blob = nullptr; } cv::Mat resizedImage; // Resize and pad the image using letterBox utility try { letterBox(image, resizedImage, inputImageShape, cv::Scalar(114, 114, 114), isDynamicInputShape, false, true, 32); } catch (const std::exception& e) { this->_logger.LogError("ANSONNXPOSE::preprocess", "letterBox failed: " + std::string(e.what()), __FILE__, __LINE__); return cv::Mat(); } // CRITICAL: Validate resized image if (resizedImage.empty() || resizedImage.data == nullptr) { this->_logger.LogError("ANSONNXPOSE::preprocess", "Resized image is empty after letterBox", __FILE__, __LINE__); return cv::Mat(); } if (resizedImage.cols <= 0 || resizedImage.rows <= 0) { this->_logger.LogError("ANSONNXPOSE::preprocess", "Invalid resized dimensions: " + std::to_string(resizedImage.cols) + "x" + std::to_string(resizedImage.rows), __FILE__, __LINE__); return cv::Mat(); } if (resizedImage.channels() != 3) { this->_logger.LogError("ANSONNXPOSE::preprocess", "Expected 3 channels but got: " + std::to_string(resizedImage.channels()), __FILE__, __LINE__); return cv::Mat(); } // CRITICAL: Validate input tensor shape size if (inputTensorShape.size() < 4) { 
this->_logger.LogError("ANSONNXPOSE::preprocess", "Input tensor shape has insufficient dimensions: " + std::to_string(inputTensorShape.size()), __FILE__, __LINE__); return cv::Mat(); } // Update input tensor shape based on resized image dimensions inputTensorShape[0] = 1; // Batch size inputTensorShape[1] = 3; // Channels inputTensorShape[2] = resizedImage.rows; inputTensorShape[3] = resizedImage.cols; DEBUG_PRINT("[Instance " << instanceId_ << "] Resized to: " << resizedImage.cols << "x" << resizedImage.rows); // Convert image to float and normalize to [0, 1] cv::Mat floatImage; try { resizedImage.convertTo(floatImage, CV_32FC3, 1.0 / 255.0); } catch (const std::exception& e) { this->_logger.LogError("ANSONNXPOSE::preprocess", "convertTo failed: " + std::string(e.what()), __FILE__, __LINE__); return cv::Mat(); } // CRITICAL: Validate after conversion if (floatImage.empty() || floatImage.data == nullptr) { this->_logger.LogError("ANSONNXPOSE::preprocess", "Float image is empty after conversion", __FILE__, __LINE__); return cv::Mat(); } // CRITICAL: Check for NaN/Inf after float conversion cv::minMaxLoc(floatImage, &minVal, &maxVal); if (std::isnan(minVal) || std::isnan(maxVal) || std::isinf(minVal) || std::isinf(maxVal)) { this->_logger.LogError("ANSONNXPOSE::preprocess", "Float image contains NaN or Inf after conversion. 
Min: " + std::to_string(minVal) + ", Max: " + std::to_string(maxVal), __FILE__, __LINE__); return cv::Mat(); } // Calculate blob size and allocate memory size_t blobSize = static_cast(floatImage.cols) * static_cast(floatImage.rows) * static_cast(floatImage.channels()); if (blobSize == 0) { this->_logger.LogError("ANSONNXPOSE::preprocess", "Calculated blob size is zero", __FILE__, __LINE__); return cv::Mat(); } // CRITICAL: Allocate and zero-initialize blob memory blob = new float[blobSize]; std::memset(blob, 0, blobSize * sizeof(float)); // Split the image into separate channels and store in CHW format std::vector chw(floatImage.channels()); size_t channelSize = static_cast(floatImage.cols) * static_cast(floatImage.rows); for (int i = 0; i < floatImage.channels(); ++i) { chw[i] = cv::Mat(floatImage.rows, floatImage.cols, CV_32FC1, blob + i * channelSize); } try { cv::split(floatImage, chw); } catch (const std::exception& e) { this->_logger.LogError("ANSONNXPOSE::preprocess", "cv::split failed: " + std::string(e.what()), __FILE__, __LINE__); delete[] blob; blob = nullptr; return cv::Mat(); } // CRITICAL: Final validation of blob data bool hasNaN = false; float blobSum = 0.0f; float blobMin = std::numeric_limits::max(); float blobMax = std::numeric_limits::lowest(); // Check first 1000 values for NaN/Inf (sampling for performance) size_t checkSize = std::min(blobSize, size_t(1000)); for (size_t i = 0; i < checkSize; ++i) { if (std::isnan(blob[i]) || std::isinf(blob[i])) { this->_logger.LogError("ANSONNXPOSE::preprocess", "NaN/Inf found in blob at index " + std::to_string(i) + ", value: " + std::to_string(blob[i]), __FILE__, __LINE__); hasNaN = true; break; } blobSum += blob[i]; blobMin = std::min(blobMin, blob[i]); blobMax = std::max(blobMax, blob[i]); } if (hasNaN) { delete[] blob; blob = nullptr; return cv::Mat(); } DEBUG_PRINT("[Instance " << instanceId_ << "] Preprocessing completed. 
" << "Tensor shape: " << inputTensorShape[0] << "x" << inputTensorShape[1] << "x" << inputTensorShape[2] << "x" << inputTensorShape[3] << " | Blob stats (sampled) - Min: " << blobMin << ", Max: " << blobMax << ", Sum: " << blobSum << ", Avg: " << (blobSum / checkSize)); return floatImage; // Return the preprocessed image for potential use } catch (const std::exception& e) { this->_logger.LogFatal("ANSONNXPOSE::preprocess", std::string("[Instance ") + std::to_string(instanceId_) + "] " + e.what(), __FILE__, __LINE__); // Clean up blob on error if (blob != nullptr) { delete[] blob; blob = nullptr; } return cv::Mat(); } } std::vector ANSONNXPOSE::postprocess( const cv::Size& originalImageSize, const cv::Size& resizedImageShape, const std::vector& outputTensors, const std::string& camera_id) { std::lock_guard lock(_mutex); try { std::vector detections; // CRITICAL: Validate output tensors if (outputTensors.empty()) { this->_logger.LogError("ANSONNXPOSE::postprocess", "No output tensors", __FILE__, __LINE__); return {}; } const float* rawOutput = outputTensors[0].GetTensorData(); if (!rawOutput) { this->_logger.LogError("ANSONNXPOSE::postprocess", "rawOutput pointer is null", __FILE__, __LINE__); return {}; } const std::vector outputShape = outputTensors[0].GetTensorTypeAndShapeInfo().GetShape(); // CRITICAL: Validate output shape if (outputShape.size() < 3) { this->_logger.LogError("ANSONNXPOSE::postprocess", "Invalid output shape dimensions: " + std::to_string(outputShape.size()), __FILE__, __LINE__); return {}; } const int featuresPerKeypoint = 3; // x, y, confidence const size_t numFeatures = static_cast(outputShape[1]); const size_t numDetections = static_cast(outputShape[2]); // With this: const int derivedKps = static_cast((numFeatures - 5) / featuresPerKeypoint); const int numKeypoints = (derivedKps > 0 && derivedKps <= 133) ? 
derivedKps : _modelConfig.numKPS; DEBUG_PRINT("[Instance " << instanceId_ << "] Keypoints: " << numKeypoints << " (derived=" << derivedKps << ", config=" << _modelConfig.numKPS << ")"); const size_t expectedFeatures = 4 + 1 + numKeypoints * featuresPerKeypoint; // box(4) + conf(1) + kpts(17*3) DEBUG_PRINT("[Instance " << instanceId_ << "] Output shape: [" << outputShape[0] << ", " << outputShape[1] << ", " << outputShape[2] << "]"); DEBUG_PRINT("[Instance " << instanceId_ << "] Detections: " << numDetections << ", Features: " << numFeatures << " (expected: " << expectedFeatures << ")"); if (numFeatures != expectedFeatures) { this->_logger.LogError("ANSONNXPOSE::postprocess", "Invalid output shape for pose estimation. Expected " + std::to_string(expectedFeatures) + " features, got " + std::to_string(numFeatures), __FILE__, __LINE__); return {}; } if (numDetections == 0) { DEBUG_PRINT("[Instance " << instanceId_ << "] No detections in output"); return {}; } // CRITICAL: Validate image sizes if (originalImageSize.width <= 0 || originalImageSize.height <= 0) { this->_logger.LogError("ANSONNXPOSE::postprocess", "Invalid original image size: " + std::to_string(originalImageSize.width) + "x" + std::to_string(originalImageSize.height), __FILE__, __LINE__); return {}; } if (resizedImageShape.width <= 0 || resizedImageShape.height <= 0) { this->_logger.LogError("ANSONNXPOSE::postprocess", "Invalid resized image size: " + std::to_string(resizedImageShape.width) + "x" + std::to_string(resizedImageShape.height), __FILE__, __LINE__); return {}; } // CRITICAL: Check for NaN/Inf in raw output (conditional based on validation level) size_t totalSize = numFeatures * numDetections; size_t checkSize = std::min(totalSize, size_t(1000)); for (size_t i = 0; i < checkSize; ++i) { if (std::isnan(rawOutput[i]) || std::isinf(rawOutput[i])) { this->_logger.LogError("ANSONNXPOSE::postprocess", "NaN/Inf detected in model output at index " + std::to_string(i) + ", value: " + 
std::to_string(rawOutput[i]), __FILE__, __LINE__); return {}; } }

    // ------------------------------------------------------------------
    // postprocess (interior — the function signature starts above this
    // chunk). Decodes the raw YOLO-pose output into boxes + keypoints,
    // filters invalid values, runs NMS and serializes keypoints.
    // Raw tensor layout (established by the indexing below,
    // rawOutput[f * numDetections + d]): feature-major — feature f of
    // detection d is at f*numDetections + d. Features 0..3 = cx,cy,w,h
    // (letterboxed coords), 4 = objectness, 5.. = keypoint triples.
    // ------------------------------------------------------------------

    // Calculate letterbox padding parameters (inverse of the preprocess
    // letterbox, so detections can be mapped back to original coords).
    const float scaleX = static_cast(resizedImageShape.width) / static_cast(originalImageSize.width);
    const float scaleY = static_cast(resizedImageShape.height) / static_cast(originalImageSize.height);
    const float scale = std::min(scaleX, scaleY);
    // Guard against degenerate scale (zero-sized input, NaN propagation).
    if (scale <= 0.0f || std::isnan(scale) || std::isinf(scale)) {
        this->_logger.LogError("ANSONNXPOSE::postprocess", "Invalid scale factor: " + std::to_string(scale), __FILE__, __LINE__);
        return {};
    }
    const cv::Size scaledSize(
        static_cast(originalImageSize.width * scale),
        static_cast(originalImageSize.height * scale)
    );
    // Symmetric letterbox padding (pixels added on each side).
    const cv::Point2f padding(
        (resizedImageShape.width - scaledSize.width) / 2.0f,
        (resizedImageShape.height - scaledSize.height) / 2.0f
    );
    DEBUG_PRINT("[Instance " << instanceId_ << "] Scale: " << scale << ", Padding: (" << padding.x << ", " << padding.y << ")");
    // Process each detection
    std::vector boxes; // Use cv::Rect for NMSBoxes compatibility
    std::vector confidences;
    std::vector> allKeypoints;
    size_t validDetections = 0;
    for (size_t d = 0; d < numDetections; ++d) {
        // Get object confidence
        const float objConfidence = rawOutput[4 * numDetections + d];
        // CRITICAL: Validate confidence value
        if (std::isnan(objConfidence) || std::isinf(objConfidence)) {
            continue;
        }
        if (objConfidence < _modelConfig.detectionScoreThreshold) {
            continue;
        }
        // Decode bounding box (center-x, center-y, width, height).
        const float cx = rawOutput[0 * numDetections + d];
        const float cy = rawOutput[1 * numDetections + d];
        const float w = rawOutput[2 * numDetections + d];
        const float h = rawOutput[3 * numDetections + d];
        // CRITICAL: Validate bounding box values
        if (std::isnan(cx) || std::isnan(cy) || std::isnan(w) || std::isnan(h) ||
            std::isinf(cx) || std::isinf(cy) || std::isinf(w) || std::isinf(h)) {
            continue;
        }
        if (w <= 0 || h <= 0) {
            continue; // Invalid box dimensions
        }
        // Convert to original image coordinates (undo padding, then scale).
        float x1 = (cx - padding.x - w / 2.0f) / scale;
        float y1 = (cy - padding.y - h / 2.0f) / scale;
        float box_w = w / scale;
        float box_h = h / scale;
        // Clip to image boundaries
        x1 = std::max(0.0f, std::min(x1, static_cast(originalImageSize.width - 1)));
        y1 = std::max(0.0f, std::min(y1, static_cast(originalImageSize.height - 1)));
        box_w = std::max(1.0f, std::min(box_w, static_cast(originalImageSize.width) - x1));
        box_h = std::max(1.0f, std::min(box_h, static_cast(originalImageSize.height) - y1));
        cv::Rect box(
            static_cast(x1),
            static_cast(y1),
            static_cast(box_w),
            static_cast(box_h)
        );
        // Extract keypoints
        std::vector keypoints;
        keypoints.reserve(numKeypoints);
        bool validKeypoints = true;
        for (int k = 0; k < numKeypoints; ++k) {
            const size_t offset = 5 + k * featuresPerKeypoint;
            // CRITICAL: Bounds check before touching the raw buffer
            if ((offset + 2) * numDetections + d >= numFeatures * numDetections) {
                this->_logger.LogError("ANSONNXPOSE::postprocess", "Keypoint index out of bounds", __FILE__, __LINE__);
                validKeypoints = false;
                break;
            }
            const float kpt_x = rawOutput[offset * numDetections + d];
            const float kpt_y = rawOutput[(offset + 1) * numDetections + d];
            const float kpt_conf_raw = rawOutput[(offset + 2) * numDetections + d];
            // CRITICAL: Validate keypoint values
            if (std::isnan(kpt_x) || std::isnan(kpt_y) || std::isnan(kpt_conf_raw) ||
                std::isinf(kpt_x) || std::isinf(kpt_y) || std::isinf(kpt_conf_raw)) {
                this->_logger.LogWarn("ANSONNXPOSE::postprocess", "NaN/Inf in keypoint " + std::to_string(k) + " of detection " + std::to_string(d), __FILE__, __LINE__);
                validKeypoints = false;
                break;
            }
            cv::Point2f kpt;
            // Map the keypoint back into original-image coordinates.
            kpt.x = (kpt_x - padding.x) / scale;
            kpt.y = (kpt_y - padding.y) / scale;
            // NOTE(review): kpt_conf_raw is read and validated but never
            // stored — the sigmoid/confidence code below is commented out,
            // so keypoint confidence is discarded. Confirm intentional.
            // Sigmoid activation for confidence
            //kpt.confidence = 1.0f / (1.0f + std::exp(-kpt_conf_raw));
            // CRITICAL: Validate sigmoid result
            //if (std::isnan(kpt.confidence) || std::isinf(kpt.confidence)) {
            //    kpt.confidence = 0.0f; // Fallback for extreme values
            //}
            // Clip keypoints to image boundaries
            kpt.x = std::max(0.0f, std::min(kpt.x, static_cast(originalImageSize.width - 1)));
            kpt.y = std::max(0.0f, std::min(kpt.y, static_cast(originalImageSize.height - 1)));
            keypoints.push_back(kpt);
        }
        if (!validKeypoints) {
            continue; // Skip this detection if keypoints are invalid
        }
        // Store detection components
        boxes.push_back(box);
        confidences.push_back(objConfidence);
        allKeypoints.push_back(std::move(keypoints));
        validDetections++;
    }
    DEBUG_PRINT("[Instance " << instanceId_ << "] Valid detections before NMS: " << validDetections);
    if (boxes.empty()) {
        DEBUG_PRINT("[Instance " << instanceId_ << "] No valid detections after filtering");
        return {};
    }
    // Apply Non-Maximum Suppression (OpenCV; may throw cv::Exception).
    std::vector indices;
    try {
        cv::dnn::NMSBoxes(
            boxes,
            confidences,
            _modelConfig.modelConfThreshold,
            _modelConfig.modelMNSThreshold,
            indices
        );
    }
    catch (const cv::Exception& e) {
        this->_logger.LogError("ANSONNXPOSE::postprocess", "NMS failed: " + std::string(e.what()), __FILE__, __LINE__);
        return {};
    }
    DEBUG_PRINT("[Instance " << instanceId_ << "] Detections after NMS: " << indices.size());
    // Create final detections
    detections.reserve(indices.size());
    for (int idx : indices) {
        // Validate index (defensive — NMSBoxes should only emit valid ones).
        if (idx < 0 || idx >= static_cast(boxes.size())) {
            this->_logger.LogWarn("ANSONNXPOSE::postprocess", "Invalid NMS index: " + std::to_string(idx), __FILE__, __LINE__);
            continue;
        }
        // Serialize keypoints as "x1;x2;...|y1;y2;..." plus a flat x,y list.
        std::stringstream keypointXss;
        std::stringstream keypointYss;
        std::vector keypointValues;
        for (size_t keypointIdx = 0; keypointIdx < allKeypoints[idx].size(); keypointIdx++) {
            keypointXss << allKeypoints[idx][keypointIdx].x;
            keypointYss << allKeypoints[idx][keypointIdx].y;
            // Add semicolon after each value except the last one
            if (keypointIdx < allKeypoints[idx].size() - 1) {
                keypointXss << ";";
                keypointYss << ";";
            }
            keypointValues.push_back(allKeypoints[idx][keypointIdx].x);
            keypointValues.push_back(allKeypoints[idx][keypointIdx].y);
        }
        std::string keypointXString = keypointXss.str();
        std::string keypointYString = keypointYss.str();
        std::string keypointString = keypointXString + "|" + keypointYString;
Object det;
        det.box = boxes[idx];
        det.confidence = confidences[idx];
        det.classId = 0; // Pose model detects a single class
        det.className = "Person";
        det.cameraId = camera_id;
        det.polygon = allKeypoints[idx];
        det.kps = keypointValues;
        det.extraInfo = keypointString; // Keypoints serialized as "x1;x2;...|y1;y2;..."
        detections.push_back(det);
    }
    DEBUG_PRINT("[Instance " << instanceId_ << "] Final detections: " << detections.size());
    return detections;
}
catch (const std::exception& e) {
    this->_logger.LogFatal("ANSONNXPOSE::postprocess", std::string("[Instance ") + std::to_string(instanceId_) + "] " + e.what(), __FILE__, __LINE__);
    return {};
}
}

// ---------------------------------------------------------------------------
// detect
// Full single-image pipeline: validate input -> preprocess into a heap
// float blob -> ONNX Runtime inference -> postprocess into detections.
// Returns {} on any failure (errors are logged, never thrown to callers).
// NOTE(review): blobPtr is a raw new[]-style allocation freed manually on
// every early-return path; an RAII owner (e.g. unique_ptr<float[]>) would
// remove that hazard — TODO confirm preprocess() allocates with new[].
// NOTE(review): this method locks _mutex and is called from RunInference(),
// which also locks _mutex — safe only if _mutex is recursive; confirm.
// ---------------------------------------------------------------------------
std::vector ANSONNXPOSE::detect(const cv::Mat& image, const std::string& camera_id) {
    std::lock_guard lock(_mutex);
    float* blobPtr = nullptr; // Owned here; released after inference or on error
    try {
        // CRITICAL: Validate input image
        if (image.empty()) {
            this->_logger.LogError("ANSONNXPOSE::detect", "Input image is empty", __FILE__, __LINE__);
            return {};
        }
        if (image.data == nullptr) {
            this->_logger.LogError("ANSONNXPOSE::detect", "Input image data pointer is null", __FILE__, __LINE__);
            return {};
        }
        if (image.cols <= 0 || image.rows <= 0) {
            this->_logger.LogError("ANSONNXPOSE::detect", "Invalid image dimensions: " + std::to_string(image.cols) + "x" + std::to_string(image.rows), __FILE__, __LINE__);
            return {};
        }
        DEBUG_PRINT("[Instance " << instanceId_ << "] Detecting pose in " << image.cols << "x" << image.rows << " image");
        // Define the shape of the input tensor (batch size, channels, height, width)
        std::vector inputTensorShape = { 1, 3, inputImageShape.height, inputImageShape.width };
        // Preprocess the image and obtain a pointer to the blob
        cv::Mat preprocessedImage = preprocess(image, blobPtr, inputTensorShape);
        // CRITICAL: Validate preprocessing result
        if (preprocessedImage.empty() || blobPtr == nullptr) {
            this->_logger.LogError("ANSONNXPOSE::detect", "Preprocessing failed", __FILE__, __LINE__);
            if (blobPtr) {
                delete[] blobPtr;
                blobPtr = nullptr;
            }
            return {};
        }
        // Validate tensor shape was properly updated (must stay NCHW rank 4)
        if (inputTensorShape.size() != 4) {
            this->_logger.LogError("ANSONNXPOSE::detect", "Invalid input tensor shape dimensions: " + std::to_string(inputTensorShape.size()), __FILE__, __LINE__);
            delete[] blobPtr;
            return {};
        }
        // Compute the total number of elements in the input tensor
        size_t inputTensorSize = 1;
        for (auto dim : inputTensorShape) {
            if (dim <= 0) {
                this->_logger.LogError("ANSONNXPOSE::detect", "Invalid dimension in tensor shape: " + std::to_string(dim), __FILE__, __LINE__);
                delete[] blobPtr;
                return {};
            }
            inputTensorSize *= static_cast(dim);
        }
        if (inputTensorSize == 0) {
            this->_logger.LogError("ANSONNXPOSE::detect", "Input tensor size is zero", __FILE__, __LINE__);
            delete[] blobPtr;
            return {};
        }
        DEBUG_PRINT("[Instance " << instanceId_ << "] Tensor shape: [" << inputTensorShape[0] << ", " << inputTensorShape[1] << ", " << inputTensorShape[2] << ", " << inputTensorShape[3] << "], Size: " << inputTensorSize);
        // CRITICAL: Create memory info (use static to avoid recreation overhead)
        // NOTE(review): this static is shared by all instances; assumed safe
        // because the MemoryInfo is never mutated after creation — confirm.
        static Ort::MemoryInfo memoryInfo = Ort::MemoryInfo::CreateCpu(OrtArenaAllocator, OrtMemTypeDefault);
        // CRITICAL: Create input tensor directly from blob pointer
        // DO NOT copy to vector - this wastes memory and time
        // The blob must remain valid during inference!
        Ort::Value inputTensor = Ort::Value::CreateTensor(
            memoryInfo,
            blobPtr, // Use blob pointer directly
            inputTensorSize,
            inputTensorShape.data(),
            inputTensorShape.size()
        );
        // CRITICAL: Validate tensor was created successfully
        if (!inputTensor.IsTensor()) {
            this->_logger.LogError("ANSONNXPOSE::detect", "Failed to create input tensor", __FILE__, __LINE__);
            delete[] blobPtr;
            return {};
        }
        // Run the inference session with the input tensor
        std::vector outputTensors;
        try {
            outputTensors = session.Run(
                Ort::RunOptions{ nullptr },
                inputNames.data(),
                &inputTensor,
                numInputNodes,
                outputNames.data(),
                numOutputNodes
            );
        }
        catch (const Ort::Exception& e) {
            this->_logger.LogError("ANSONNXPOSE::detect", "ONNX Runtime exception during inference: " + std::string(e.what()), __FILE__, __LINE__);
            delete[] blobPtr;
            return {};
        }
        catch (const std::exception& e) {
            this->_logger.LogError("ANSONNXPOSE::detect", "Exception during inference: " + std::string(e.what()), __FILE__, __LINE__);
            delete[] blobPtr;
            return {};
        }
        // CRITICAL: NOW it's safe to delete blob (after inference completes)
        delete[] blobPtr;
        blobPtr = nullptr;
        // Validate output tensors
        if (outputTensors.empty()) {
            this->_logger.LogError("ANSONNXPOSE::detect", "No output tensors from inference", __FILE__, __LINE__);
            return {};
        }
        DEBUG_PRINT("[Instance " << instanceId_ << "] Inference completed, processing outputs");
        // Determine the resized image shape based on input tensor shape
        cv::Size resizedImageShape(
            static_cast(inputTensorShape[3]),
            static_cast(inputTensorShape[2])
        );
        // Postprocess the output tensors to obtain detections
        std::vector detections;
        try {
            detections = postprocess(image.size(), resizedImageShape, outputTensors, camera_id);
        }
        catch (const std::exception& e) {
            this->_logger.LogError("ANSONNXPOSE::detect", "Exception during postprocessing: " + std::string(e.what()), __FILE__, __LINE__);
            return {};
        }
        DEBUG_PRINT("[Instance " << instanceId_ << "] Detection completed, found " << detections.size() << " pose(s)");
        return detections;
    }
    catch (const std::exception& e) {
        this->_logger.LogFatal("ANSONNXPOSE::detect", std::string("[Instance ") + std::to_string(instanceId_) + "] " + e.what(), __FILE__, __LINE__);
        // Clean up blob if still allocated
        if (blobPtr != nullptr) {
            delete[] blobPtr;
            blobPtr = nullptr;
        }
        return {};
    }
}

// Public functions

// Destructor: delegates all teardown to Destroy().
ANSONNXPOSE::~ANSONNXPOSE() {
    Destroy();
}

// Tears down the instance. Currently only logs; the ONNX session and
// base-class resources are released by their own destructors.
bool ANSONNXPOSE::Destroy() {
    std::cout << "[ANSONNXPOSE] Destroyed instance " << instanceId_ << std::endl;
    return true;
}

// Thin wrapper over the base-class model optimization (e.g. FP16).
bool ANSONNXPOSE::OptimizeModel(bool fp16, std::string& optimizedModelFolder) {
    if (!ANSODBase::OptimizeModel(fp16, optimizedModelFolder)) {
        return false;
    }
    return true;
}

// ---------------------------------------------------------------------------
// Initialize
// Full setup from an encrypted model zip: base-class init, config defaults
// (640x640 input, threshold clamping, keypoint count), class-name loading,
// then ONNX session creation via Init(). Returns false on any failure.
// ---------------------------------------------------------------------------
bool ANSONNXPOSE::Initialize(std::string licenseKey, ModelConfig modelConfig, const std::string& modelZipFilePath, const std::string& modelZipPassword, std::string& labelMap) {
    std::lock_guard lock(_mutex);
    try {
        _modelLoadValid = false;
        bool result = ANSODBase::Initialize(licenseKey, modelConfig, modelZipFilePath, modelZipPassword, labelMap);
        if (!result) return false;
        // Parsing for YOLO only here
        _modelConfig = modelConfig;
        _modelConfig.detectionType = ANSCENTER::DetectionType::DETECTION;
        _modelConfig.modelType = ModelType::ONNXPOSE;
        _modelConfig.inpHeight = 640;
        _modelConfig.inpWidth = 640;
        // Clamp obviously-bad thresholds to sane defaults.
        if (_modelConfig.modelMNSThreshold < 0.2) _modelConfig.modelMNSThreshold = 0.5;
        if (_modelConfig.modelConfThreshold < 0.2) _modelConfig.modelConfThreshold = 0.5;
        // After
        if (_modelConfig.numKPS <= 0 || _modelConfig.numKPS > 133) // 133 = COCO wholebody max
            _modelConfig.numKPS = 17;
        if (_modelConfig.kpsThreshold == 0)_modelConfig.kpsThreshold = 0.5; // If not define
        _fp16 = (modelConfig.precisionType == PrecisionType::FP16);
        if (FileExist(_modelConfigFile)) {
            ModelType modelType;
            std::vector inputShape;
            _classes = ANSUtilityHelper::GetConfigFileContent(_modelConfigFile, modelType, inputShape);
            if (inputShape.size() == 2) {
                if (inputShape[0] > 0)_modelConfig.inpHeight = inputShape[0];
                if (inputShape[1] >
0)_modelConfig.inpWidth = inputShape[1];
            }
        }
        else {// This is old version of model zip file
            _modelFilePath = CreateFilePath(_modelFolder, "train_last.onnx");
            _classFilePath = CreateFilePath(_modelFolder, "classes.names");
            std::ifstream isValidFileName(_classFilePath);
            if (!isValidFileName) {
                // NOTE(review): log tag reads "ANSONNXCL" — looks copy-pasted
                // from the classifier backend; should likely say "ANSONNXPOSE".
                this->_logger.LogDebug("ANSONNXCL::Initialize. Load classes from string", _classFilePath, __FILE__, __LINE__);
                LoadClassesFromString();
            }
            else {
                this->_logger.LogDebug("ANSONNXCL::Initialize. Load classes from file", _classFilePath, __FILE__, __LINE__);
                LoadClassesFromFile();
            }
        }
        // 1. Load labelMap and engine
        labelMap.clear();
        if (!_classes.empty()) labelMap = VectorToCommaSeparatedString(_classes);
        // 2. Initialize ONNX Runtime session
        instanceId_ = instanceCounter_.fetch_add(1); // Atomic increment
        result = Init(_modelFilePath, true,0);
        _modelLoadValid = true;
        _isInitialized = true;
        return result;
    }
    catch (const std::exception& e) {
        // NOTE(review): tag "ANSONNXCL::Initialize" — same copy-paste issue.
        this->_logger.LogFatal("ANSONNXCL::Initialize", e.what(), __FILE__, __LINE__);
        return false;
    }
}

// ---------------------------------------------------------------------------
// LoadModel
// Re-loads the model from a zip without the license/label work that
// Initialize() performs, applies the same config defaults, then recreates
// the ONNX session via Init().
// NOTE(review): detectionType is set to CLASSIFICATION and modelType to
// TENSORRT here, while Initialize() uses DETECTION / ONNXPOSE for the same
// class — this looks copy-pasted from another backend; confirm intended.
// ---------------------------------------------------------------------------
bool ANSONNXPOSE::LoadModel(const std::string& modelZipFilePath, const std::string& modelZipPassword) {
    std::lock_guard lock(_mutex);
    try {
        bool result = ANSODBase::LoadModel(modelZipFilePath, modelZipPassword);
        if (!result) return false;
        _modelConfig.detectionType = ANSCENTER::DetectionType::CLASSIFICATION;
        _modelConfig.modelType = ModelType::TENSORRT;
        _modelConfig.inpHeight = 640;
        _modelConfig.inpWidth = 640;
        // Clamp obviously-bad thresholds to sane defaults.
        if (_modelConfig.modelMNSThreshold < 0.2) _modelConfig.modelMNSThreshold = 0.5;
        if (_modelConfig.modelConfThreshold < 0.2) _modelConfig.modelConfThreshold = 0.5;
        // After
        if (_modelConfig.numKPS <= 0 || _modelConfig.numKPS > 133) // 133 = COCO wholebody max
            _modelConfig.numKPS = 17;
        if (_modelConfig.kpsThreshold == 0)_modelConfig.kpsThreshold = 0.5; // If not define
        // if (_modelConfig.precisionType == PrecisionType::FP16)_fp16 = true;
        _fp16 = true;
        // Load Model from Here
        // 0. Check if the configuration file exist
        if (FileExist(_modelConfigFile)) {
            ModelType modelType;
            std::vector inputShape;
            _classes = ANSUtilityHelper::GetConfigFileContent(_modelConfigFile, modelType, inputShape);
            if (inputShape.size() == 2) {
                if (inputShape[0] > 0)_modelConfig.inpHeight = inputShape[0];
                if (inputShape[1] > 0)_modelConfig.inpWidth = inputShape[1];
            }
        }
        else {// This is old version of model zip file
            _modelFilePath = CreateFilePath(_modelFolder, "train_last.onnx");
            _classFilePath = CreateFilePath(_modelFolder, "classes.names");
            std::ifstream isValidFileName(_classFilePath);
            if (!isValidFileName) {
                this->_logger.LogDebug("ANSONNXPOSE::Initialize. Load classes from string", _classFilePath, __FILE__, __LINE__);
                LoadClassesFromString();
            }
            else {
                this->_logger.LogDebug("ANSONNXPOSE::Initialize. Load classes from file", _classFilePath, __FILE__, __LINE__);
                LoadClassesFromFile();
            }
        }
        // Initialize ONNX Runtime session
        instanceId_ = instanceCounter_.fetch_add(1); // Atomic increment
        result = Init(_modelFilePath, true, 0);
        _modelLoadValid = true;
        _isInitialized = true;
        return result;
    }
    catch (const std::exception& e) {
        this->_logger.LogFatal("ANSONNXPOSE::LoadModel", e.what(), __FILE__, __LINE__);
        return false;
    }
}

// ---------------------------------------------------------------------------
// LoadModelFromFolder
// Loads a model directly from an unpacked folder. modelName defaults to
// "train_last" when empty; className names the class-list file.
// ---------------------------------------------------------------------------
bool ANSONNXPOSE::LoadModelFromFolder(std::string licenseKey, ModelConfig modelConfig, std::string modelName, std::string className, const std::string& modelFolder, std::string& labelMap) {
    std::lock_guard lock(_mutex);
    try {
        bool result = ANSODBase::LoadModelFromFolder(licenseKey, modelConfig, modelName, className, modelFolder, labelMap);
        if (!result) return false;
        std::string _modelName = modelName;
        if (_modelName.empty()) {
            _modelName = "train_last";
        }
        std::string modelFullName = _modelName + ".onnx";
        // Parsing for YOLO only here
        _modelConfig = modelConfig;
        _modelConfig.detectionType = ANSCENTER::DetectionType::CLASSIFICATION;
        _modelConfig.modelType = ModelType::TENSORRT;
        _modelConfig.inpHeight = 640;
        _modelConfig.inpWidth = 640;
        if
(_modelConfig.modelMNSThreshold < 0.2) _modelConfig.modelMNSThreshold = 0.5;
        if (_modelConfig.modelConfThreshold < 0.2) _modelConfig.modelConfThreshold = 0.5;
        // After
        if (_modelConfig.numKPS <= 0 || _modelConfig.numKPS > 133) // 133 = COCO wholebody max
            _modelConfig.numKPS = 17;
        if (_modelConfig.kpsThreshold == 0)_modelConfig.kpsThreshold = 0.5; // If not define
        _fp16 = true;
        // Load Model from Here
        // 0. Check if the configuration file exist
        if (FileExist(_modelConfigFile)) {
            ModelType modelType;
            std::vector inputShape;
            _classes = ANSUtilityHelper::GetConfigFileContent(_modelConfigFile, modelType, inputShape);
            if (inputShape.size() == 2) {
                if (inputShape[0] > 0)_modelConfig.inpHeight = inputShape[0];
                if (inputShape[1] > 0)_modelConfig.inpWidth = inputShape[1];
            }
        }
        else {// This is old version of model zip file
            _modelFilePath = CreateFilePath(_modelFolder, modelFullName);
            _classFilePath = CreateFilePath(_modelFolder, className);
            std::ifstream isValidFileName(_classFilePath);
            if (!isValidFileName) {
                this->_logger.LogDebug("ANSONNXPOSE::Initialize. Load classes from string", _classFilePath, __FILE__, __LINE__);
                LoadClassesFromString();
            }
            else {
                this->_logger.LogDebug("ANSONNXPOSE::Initialize. Load classes from file", _classFilePath, __FILE__, __LINE__);
                LoadClassesFromFile();
            }
        }
        // 1. Load labelMap and engine
        labelMap.clear();
        if (!_classes.empty()) labelMap = VectorToCommaSeparatedString(_classes);
        // 2. Initialize ONNX Runtime session
        // NOTE(review): unlike Initialize()/LoadModel(), no Init(...) call is
        // made here before marking the model valid — confirm the base class
        // creates the session, otherwise inference will run uninitialized.
        instanceId_ = instanceCounter_.fetch_add(1); // Atomic increment
        _modelLoadValid = true;
        _isInitialized = true;
        return result;
    }
    catch (const std::exception& e) {
        this->_logger.LogFatal("ANSONNXPOSE::LoadModelFromFolder", e.what(), __FILE__, __LINE__);
        return false;
    }
}

// ---------------------------------------------------------------------------
// RunInference (public entry point)
// Validates model/license/initialization state, runs detect(), then applies
// optional tracking and stabilization. Returns an empty vector on failure
// or for degenerate input frames.
// NOTE(review): detect() locks _mutex again while this method holds it —
// safe only if _mutex is a recursive mutex; confirm the declared type.
// ---------------------------------------------------------------------------
std::vector ANSONNXPOSE::RunInference(const cv::Mat& input, const std::string& camera_id) {
    std::lock_guard lock(_mutex);
    if (!_modelLoadValid) {
        // NOTE(review): message mentions "TensorRT" but this is the ONNX
        // backend, and "if it is exist" should read "if it exists".
        this->_logger.LogFatal("ANSONNXPOSE::RunInference", "Cannot load the TensorRT model. Please check if it is exist", __FILE__, __LINE__);
        std::vector result;
        result.clear();
        return result;
    }
    if (!_licenseValid) {
        this->_logger.LogFatal("ANSONNXPOSE::RunInference", "Runtime license is not valid or expired. Please contact ANSCENTER", __FILE__, __LINE__);
        std::vector result;
        result.clear();
        return result;
    }
    if (!_isInitialized) {
        this->_logger.LogFatal("ANSONNXPOSE::RunInference", "Model is not initialized", __FILE__, __LINE__);
        std::vector result;
        result.clear();
        return result;
    }
    try {
        std::vector result;
        if (input.empty()) return result;
        // Reject degenerate frames (anything smaller than 5x5 pixels).
        if ((input.cols < 5) || (input.rows < 5)) return result;
        result = detect(input, camera_id);
        if (_trackerEnabled) {
            result = ApplyTracking(result, camera_id);
            if (_stabilizationEnabled) result = StabilizeDetections(result, camera_id);
        }
        return result;
    }
    catch (const std::exception& e) {
        this->_logger.LogFatal("ANSONNXPOSE::RunInference", e.what(), __FILE__, __LINE__);
        return {};
    }
}

// Convenience overload: runs inference with a default camera id.
std::vector ANSONNXPOSE::RunInference(const cv::Mat& inputImgBGR) {
    return RunInference(inputImgBGR, "CustomCam");
}

} // namespace ANSCENTER