#include "ANSFRCommon.h"
#include "dirent.h"
// NOTE(review): the original include list was corrupted (five empty #include
// directives — angle-bracket content was stripped). The standard headers below
// were reconstructed from usage in this file; confirm against version control.
#include <algorithm>
#include <cctype>
#include <cmath>
#include <cstring>
#include <ctime>
#include <fstream>
#include <iomanip>
#include <iostream>
#include <sstream>

namespace ANSCENTER {

    // Batch capacity the detector models are sized for.
    constexpr size_t ndetections = 200;

    /// Reads `key` from a boost property tree.
    /// Returns a value-initialized T when the key is absent (the original
    /// returned an *uninitialized* T in that case).
    template <typename T>
    T GetData(const boost::property_tree::ptree& pt, const std::string& key) {
        T ret{};
        if (boost::optional<T> data = pt.get_optional<T>(key)) {
            ret = data.get();
        }
        return ret;
    }

    /// A tracked face: bounding box plus smoothed per-attribute state.
    Face::Face(size_t id, cv::Rect& location)
        : _location(location), _intensity_mean(0.f), _id(id), _age(-1),
          _maleScore(0), _femaleScore(0), _realFaceConfidence(0),
          _isAgeGenderEnabled(false), _isEmotionsEnabled(false),
          _isHeadPoseEnabled(false), _isLandmarksEnabled(false),
          _isAntispoofingEnabled(false) {
        // These two members were never initialized by the original ctor.
        _faceLiveness = 0;
        _isFaceLivenessEnabled = false;
        HeadPoseResults headPose;
        headPose.angle_p = 0.f;
        headPose.angle_r = 0.f;
        headPose.angle_y = 0.f;
        _headPose = headPose;
    }

    // Exponential smoothing of the age estimate (first sample taken as-is).
    void Face::updateAge(float value) {
        _age = (_age == -1) ? value : 0.95f * _age + 0.05f * value;
    }

    // Accumulates gender evidence; > 0.5 counts toward male, < 0.5 toward female.
    void Face::updateGender(float value) {
        if (value < 0) return;
        if (value > 0.5) {
            _maleScore += value - 0.5f;
        } else {
            _femaleScore += 0.5f - value;
        }
    }

    // Exponential smoothing (0.9/0.1) of each emotion score.
    void Face::updateEmotions(std::map<std::string, float> values) {
        for (auto& kv : values) {
            auto it = _emotions.find(kv.first);
            if (it == _emotions.end()) {
                _emotions[kv.first] = kv.second;
            } else {
                it->second = 0.9f * it->second + 0.1f * kv.second;
            }
        }
    }

    void Face::updateHeadPose(HeadPoseResults values) { _headPose = values; }

    void Face::updateLandmarks(std::vector<float> values) { _landmarks = std::move(values); }

    void Face::updateRealFaceConfidence(float value) { _realFaceConfidence = value; }

    void Face::updateFaceLiveness(int value) { _faceLiveness = value; }

    // Rounds the smoothed age to the nearest integer.
    int Face::getAge() { return static_cast<int>(std::floor(_age + 0.5f)); }

    bool Face::isMale() { return _maleScore > _femaleScore; }

    // Anti-spoofing decision threshold (confidence is a percentage / 100 scale).
    bool Face::isReal() { return _realFaceConfidence > 0.4; }

    float Face::getAntispoofingScore() { return _realFaceConfidence; }

    int Face::getFaceLiveness() { return _faceLiveness; }

    std::map<std::string, float> Face::getEmotions() { return _emotions; }

    /// Returns the (name, score) of the strongest emotion.
    /// Guarded: the original called max_element on a possibly-empty map and
    /// dereferenced end() (UB) when no emotion had been recorded yet.
    std::pair<std::string, float> Face::getMainEmotion() {
        if (_emotions.empty()) {
            return std::make_pair(std::string(), 0.f);
        }
        auto x = std::max_element(_emotions.begin(), _emotions.end(),
            [](const std::pair<std::string, float>& p1,
               const std::pair<std::string, float>& p2) {
                return p1.second < p2.second;
            });
        return std::make_pair(x->first, x->second);
    }

    HeadPoseResults Face::getHeadPose() { return _headPose; }

    const std::vector<float>& Face::getLandmarks() { return _landmarks; }

    size_t Face::getId() { return _id; }

    void Face::ageGenderEnable(bool value) { _isAgeGenderEnabled = value; }
    void Face::emotionsEnable(bool value) { _isEmotionsEnabled = value; }
    void Face::headPoseEnable(bool value) { _isHeadPoseEnabled = value; }
    void Face::landmarksEnable(bool value) { _isLandmarksEnabled = value; }
    void Face::antispoofingEnable(bool value) { _isAntispoofingEnabled = value; }
    void Face::faceLivenessEnable(bool value) { _isFaceLivenessEnabled = value; }

    bool Face::isAgeGenderEnabled() { return _isAgeGenderEnabled; }
    bool Face::isEmotionsEnabled() { return _isEmotionsEnabled; }
    bool Face::isHeadPoseEnabled() { return _isHeadPoseEnabled; }
    bool Face::isLandmarksEnabled() { return _isLandmarksEnabled; }
    bool Face::isAntispoofingEnabled() { return _isAntispoofingEnabled; }
    bool Face::isFaceLivenessEnabled() { return _isFaceLivenessEnabled; }

    /// Intersection-over-union of two rectangles.
    /// Guarded against 0/0 when both rectangles are empty (original divided by
    /// a possibly-zero union area).
    float calcIoU(cv::Rect& src, cv::Rect& dst) {
        cv::Rect i = src & dst;
        cv::Rect u = src | dst;
        const int uArea = u.area();
        if (uArea == 0) return 0.f;
        return static_cast<float>(i.area()) / static_cast<float>(uArea);
    }

    /// Mean grayscale intensity of a BGR image.
    float calcMean(const cv::Mat& src) {
        cv::Mat tmp;
        cv::cvtColor(src, tmp, cv::COLOR_BGR2GRAY);
        cv::Scalar mean = cv::mean(tmp);
        return static_cast<float>(mean[0]);
    }

    /// Returns the tracked face whose box best overlaps `rect` (IoU > 0.55);
    /// otherwise a fresh Face with id 0 at `rect`.
    Face matchFace(cv::Rect rect, std::list<Face>& faces) {
        Face face(0, rect);
        float maxIoU = 0.55f;
        for (auto&& f : faces) {
            float iou = calcIoU(rect, f._location);
            if (iou > maxIoU) {
                face = f;
                maxIoU = iou;
            }
        }
        return face;
    }

    BaseDetection::BaseDetection(const std::string& pathToModel, bool doRawOutputMessages)
        : pathToModel(pathToModel), doRawOutputMessages(doRawOutputMessages) {
    }

    bool BaseDetection::enabled() const { return bool(request); }

    AntispoofingClassifier::AntispoofingClassifier(const std::string& pathToModel, bool doRawOutputMessages)
        : BaseDetection(pathToModel, doRawOutputMessages) {
        _modelFilePath = pathToModel;
    }

    /// Runs anti-spoofing inference on one face crop.
    /// Returns the "real" confidence scaled to [0, 100], or -1 on failure.
    /// Thread-safe: serialized on _mutex.
    float AntispoofingClassifier::runInfer(const cv::Mat& frame) {
        std::lock_guard<std::mutex> lock(_mutex);
        try {
            cv::Mat face = frame.clone();
            // Single-image ROI over the batched input tensor.
            auto inSlice = ov::Tensor{ inTensor, {0, 0, 0, 0}, {1, inShape[1], inShape[2], inShape[3]} };
            resize2tensor(face, inSlice);
            request.set_input_tensor(ov::Tensor{ inTensor, {0, 0, 0, 0}, {1, inShape[1], inShape[2], inShape[3]} });
            request.infer();
            face.release();
            float r = request.get_output_tensor().data<float>()[0] * 100;
            return r;
        } catch (const std::exception& error) {
            std::cerr << "Error: " << error.what() << std::endl;
            return -1;
        }
    }

    /// Loads the anti-spoofing model and wires u8/NHWC -> NCHW preprocessing.
    std::shared_ptr<ov::Model> AntispoofingClassifier::read(const ov::Core& core) {
        slog::info << "Reading model: " << _modelFilePath << slog::endl;
        std::shared_ptr<ov::Model> model = core.read_model(_modelFilePath);
        ov::preprocess::PrePostProcessor ppp(model);
        ppp.input().tensor().
            set_element_type(ov::element::u8).
            set_layout("NHWC");
        ppp.input().preprocess().convert_layout("NCHW");
        ppp.output().tensor().set_element_type(ov::element::f32);
        model = ppp.build();
        inShape = model->input().get_shape();
        inShape[0] = ndetections;
        //ov::set_batch(model, { 1, int64_t(ndetections) });
        ov::set_batch(model, { 1 }); // Force single batch for all inputs
        return model;
    }

    AgeGenderDetection::AgeGenderDetection(const std::string& pathToModel, bool doRawOutputMessages)
        : BaseDetection(pathToModel, doRawOutputMessages) {
        _modelFilePath = pathToModel;
    }

    /// Runs age/gender inference on one face crop.
    /// Returns { age in years, P(male-ish channel 1) }, or { -1, -1 } on failure.
    AgeGenderResults AgeGenderDetection::runInfer(const cv::Mat& frame) {
        std::lock_guard<std::mutex> lock(_mutex);
        try {
            cv::Mat face = frame.clone();
            auto inSlice = ov::Tensor{ inTensor, {0, 0, 0, 0}, {1, inShape[1], inShape[2], inShape[3]} };
            resize2tensor(face, inSlice);
            request.set_input_tensor(ov::Tensor{ inTensor, {0, 0, 0, 0}, {1, inShape[1], inShape[2], inShape[3]} });
            request.infer();
            face.release();
            AgeGenderResults r = {
                request.get_tensor(outputAge).data<float>()[0] * 100,   // model emits age/100
                request.get_tensor(outputGender).data<float>()[0 * 2 + 1] // [female, male] pair
            };
            return r;
        } catch (const std::exception& error) {
            std::cerr << "Error: " << error.what() << std::endl; // was silently swallowed
            AgeGenderResults r = { -1, -1 };
            return r;
        }
    }

    /// Loads the age/gender model (age_conv3 / prob outputs) with u8 NHWC input.
    std::shared_ptr<ov::Model> AgeGenderDetection::read(const ov::Core& core) {
        slog::info << "Reading model: " << _modelFilePath << slog::endl;
        std::shared_ptr<ov::Model> model = core.read_model(_modelFilePath);
        outputAge = "age_conv3";
        outputGender = "prob";
        ov::preprocess::PrePostProcessor ppp(model);
        ppp.input().tensor().
            set_element_type(ov::element::u8).
            set_layout("NHWC");
        ppp.input().preprocess().
            convert_element_type(ov::element::f32).
            convert_layout("NCHW");
        ppp.output(outputAge).tensor().set_element_type(ov::element::f32);
        ppp.output(outputGender).tensor().set_element_type(ov::element::f32);
        model = ppp.build();
        inShape = model->input().get_shape();
        inShape[0] = ndetections;
        //ov::set_batch(model, { 1, int64_t(ndetections) });
        ov::set_batch(model, { 1 }); // Force single batch for all inputs
        return model;
    }

    HeadPoseDetection::HeadPoseDetection(const std::string& pathToModel, bool doRawOutputMessages)
        : BaseDetection(pathToModel, doRawOutputMessages),
          outputAngleR("angle_r_fc"), outputAngleP("angle_p_fc"), outputAngleY("angle_y_fc") {
        _modelFilePath = pathToModel;
    }

    /// Runs head-pose inference; returns roll/pitch/yaw, or { -1, -1, -1 } on failure.
    HeadPoseResults HeadPoseDetection::runInfer(const cv::Mat& frame) {
        std::lock_guard<std::mutex> lock(_mutex);
        try {
            cv::Mat face = frame.clone();
            auto inSlice = ov::Tensor{ inTensor, {0, 0, 0, 0}, {1, inShape[1], inShape[2], inShape[3]} };
            resize2tensor(face, inSlice);
            request.set_input_tensor(ov::Tensor{ inTensor, {0, 0, 0, 0}, {1, inShape[1], inShape[2], inShape[3]} });
            request.infer();
            face.release();
            HeadPoseResults r = {
                request.get_tensor(outputAngleR).data<float>()[0],
                request.get_tensor(outputAngleP).data<float>()[0],
                request.get_tensor(outputAngleY).data<float>()[0]
            };
            return r;
        } catch (const std::exception& error) {
            std::cerr << "Error: " << error.what() << std::endl; // was silently swallowed
            HeadPoseResults r = { -1, -1, -1 };
            return r;
        }
    }

    /// Loads the head-pose model with u8 NHWC input and f32 angle outputs.
    std::shared_ptr<ov::Model> HeadPoseDetection::read(const ov::Core& core) {
        std::shared_ptr<ov::Model> model = core.read_model(_modelFilePath);
        ov::preprocess::PrePostProcessor ppp(model);
        ppp.input().tensor().
            set_element_type(ov::element::u8).
            set_layout("NHWC");
        ppp.input().preprocess().convert_layout("NCHW");
        ppp.output(outputAngleR).tensor().set_element_type(ov::element::f32);
        ppp.output(outputAngleP).tensor().set_element_type(ov::element::f32);
        ppp.output(outputAngleY).tensor().set_element_type(ov::element::f32);
        model = ppp.build();
        inShape = model->input().get_shape();
        inShape[0] = ndetections;
        //ov::set_batch(model, { 1, int64_t(ndetections) });
        ov::set_batch(model, { 1 }); // Force single batch for all inputs
        return model;
    }

    EmotionsDetection::EmotionsDetection(const std::string& pathToModel, bool doRawOutputMessages)
        : BaseDetection(pathToModel, doRawOutputMessages) {
        _modelFilePath = pathToModel;
    }

    /// Runs emotion inference; returns {label -> score} keyed by emotionsVec,
    /// or an empty map when the output channel count mismatches or on failure.
    std::map<std::string, float> EmotionsDetection::runInfer(const cv::Mat& frame) {
        std::lock_guard<std::mutex> lock(_mutex);
        try {
            cv::Mat face = frame.clone();
            auto inSlice = ov::Tensor{ inTensor, {0, 0, 0, 0}, {1, inShape[1], inShape[2], inShape[3]} };
            resize2tensor(face, inSlice);
            request.set_input_tensor(ov::Tensor{ inTensor, {0, 0, 0, 0}, {1, inShape[1], inShape[2], inShape[3]} });
            request.infer();
            face.release();
            auto tensor = request.get_output_tensor();
            auto emotionsVecSize = emotionsVec.size();
            size_t numOfChannels = tensor.get_shape().at(1);
            if (numOfChannels == emotionsVecSize) {
                const float* emotionsValues = tensor.data<float>();
                // Batch index 0 — only one face is inferred per call.
                auto outputIdxPos = emotionsValues + 0 * emotionsVecSize;
                std::map<std::string, float> emotions;
                for (size_t i = 0; i < emotionsVecSize; i++) {
                    emotions[emotionsVec[i]] = outputIdxPos[i];
                }
                return emotions;
            } else
                return { };
        } catch (const std::exception& error) {
            std::cerr << "Error: " << error.what() << std::endl;
            return { };
        }
    }

    /// Loads the emotions model with u8 NHWC input and f32 output.
    std::shared_ptr<ov::Model> EmotionsDetection::read(const ov::Core& core) {
        slog::info << "Reading model: " << _modelFilePath << slog::endl;
        std::shared_ptr<ov::Model> model = core.read_model(_modelFilePath);
        ov::preprocess::PrePostProcessor ppp(model);
        ppp.input().tensor().
            set_element_type(ov::element::u8).
            set_layout("NHWC");
        ppp.input().preprocess().convert_layout("NCHW");
        ppp.output().tensor().set_element_type(ov::element::f32);
        model = ppp.build();
        inShape = model->input().get_shape();
        inShape[0] = ndetections;
        //ov::set_batch(model, { 1, int64_t(ndetections) });
        ov::set_batch(model, { 1 }); // Force single batch for all inputs
        return model;
    }

    FacialLandmarksDetection::FacialLandmarksDetection(const std::string& pathToModel, bool doRawOutputMessages)
        : BaseDetection(pathToModel, doRawOutputMessages) {
        _modelFilePath = pathToModel;
    }

    /// Runs landmark inference; returns interleaved normalized (x, y) pairs,
    /// empty on failure.
    std::vector<float> FacialLandmarksDetection::runInfer(const cv::Mat& frame) {
        std::lock_guard<std::mutex> lock(_mutex);
        std::vector<float> normedLandmarks;
        try {
            cv::Mat face = frame.clone();
            auto inSlice = ov::Tensor{ inTensor, {0, 0, 0, 0}, {1, inShape[1], inShape[2], inShape[3]} };
            resize2tensor(face, inSlice);
            request.set_input_tensor(ov::Tensor{ inTensor, {0, 0, 0, 0}, {1, inShape[1], inShape[2], inShape[3]} });
            request.infer();
            face.release();
            auto tensor = request.get_output_tensor();
            size_t n_lm = tensor.get_shape().at(1); // 2 * number of landmarks
            const float* normed_coordinates = tensor.data<float>();
            normedLandmarks.reserve(n_lm);
            for (size_t i_lm = 0; i_lm < n_lm / 2; ++i_lm) {
                normedLandmarks.push_back(normed_coordinates[2 * i_lm]);     // x
                normedLandmarks.push_back(normed_coordinates[2 * i_lm + 1]); // y
            }
            return normedLandmarks;
        } catch (const std::exception& error) {
            std::cerr << "Error: " << error.what() << std::endl;
            return normedLandmarks;
        }
    }

    /// Loads the landmarks model; preprocessing is only applied when the
    /// output is the expected [N, 70] layout (35 landmark pairs).
    std::shared_ptr<ov::Model> FacialLandmarksDetection::read(const ov::Core& core) {
        std::shared_ptr<ov::Model> model = core.read_model(_modelFilePath);
        ov::Shape outShape = model->output().get_shape();
        // Original used `&&`, which only bailed out when BOTH the rank and the
        // size were wrong; `||` rejects any unexpected output shape.
        if (outShape.size() != 2 || outShape.back() != 70) {
            return model;
        }
        ov::preprocess::PrePostProcessor ppp(model);
        ppp.input().tensor().
            set_element_type(ov::element::u8).
            set_layout("NHWC");
        ppp.input().preprocess().convert_layout("NCHW");
        ppp.output().tensor().set_element_type(ov::element::f32);
        model = ppp.build();
        inShape = model->input().get_shape();
        inShape[0] = ndetections;
        //ov::set_batch(model, { 1, int64_t(ndetections) });
        ov::set_batch(model, { 1 }); // Force single batch for all inputs
        return model;
    }

    // NOTE(review): commented-out ANSFRHelper::CheckCudaStatus /
    // CheckCublasStatus stubs (CUDA/cuBLAS error printers) removed; recover
    // from version control if the CUDA path is re-enabled.

    /// Crops every detected box out of `input` and resizes each crop to
    /// (resize_w x resize_h). With no detections, the whole frame is used.
    /// NOTE(review): cv::Size takes (width, height) — the original passes
    /// (resize_h, resize_w); preserved, but confirm square inputs or intent.
    void ANSFRHelper::GetCroppedFaces(const cv::Mat& input, std::vector<FaceObject>& outputBbox,
                                      int resize_w, int resize_h, std::vector<CroppedFace>& croppedFaces) {
        croppedFaces.clear();
        cv::Mat frame = input.clone();
        if (outputBbox.size() > 0) {
            for (auto it = outputBbox.begin(); it != outputBbox.end(); it++) {
                int x1 = (*it).box.x;
                int y1 = (*it).box.y;
                int x2 = (*it).box.x + (*it).box.width;
                int y2 = (*it).box.y + (*it).box.height;
                cv::Rect facePos(cv::Point(x1, y1), cv::Point(x2, y2));
                // Clamp to the image: the original threw when a detection box
                // extended past the frame border.
                facePos &= cv::Rect(0, 0, frame.cols, frame.rows);
                if (facePos.area() == 0) continue;
                cv::Mat tempCrop = frame(facePos);
                struct CroppedFace currFace;
                cv::resize(tempCrop, currFace.faceMat, cv::Size(resize_h, resize_w), 0, 0, cv::INTER_CUBIC);
                currFace.face = currFace.faceMat.clone();
                currFace.x1 = x1;
                currFace.y1 = y1;
                currFace.x2 = x2;
                currFace.y2 = y2;
                croppedFaces.push_back(currFace);
            }
        } else {
            // No detections: treat the full frame as one "face".
            int x1 = 0, y1 = 0, x2 = frame.cols, y2 = frame.rows;
            cv::Rect facePos(cv::Point(x1, y1), cv::Point(x2, y2));
            cv::Mat tempCrop = frame(facePos);
            struct CroppedFace currFace;
            cv::resize(tempCrop, currFace.faceMat, cv::Size(resize_h, resize_w), 0, 0, cv::INTER_CUBIC);
            currFace.face = currFace.faceMat.clone();
            currFace.x1 = x1;
            currFace.y1 = y1;
            currFace.x2 = x2;
            currFace.y2 = y2;
            croppedFaces.push_back(currFace);
        }
        frame.release();
    }

    /// Loads the JSON config file into `config`.
    /// Returns false when the file is missing or parsing fails.
    bool ANSFRHelper::LoadConfigFile(std::string configFile, FRConfig& config) {
        try {
            if (FileExist(configFile)) {
                boost::property_tree::ptree pt;
                boost::property_tree::read_json(configFile, pt);
                config._databasePath = GetData<std::string>(pt, "database_path");
                config._recEngineFile = GetData<std::string>(pt, "rec_engine");
                config._detEngineFile = GetData<std::string>(pt, "det_engine");
                return true;
            } else
                return false;
        } catch (std::exception& e) {
            std::cerr << "ANSFRHelper::LoadConfigFile" << e.what();
            return false;
        }
    }

    /// Collects all "<root>/<class>/<name>.jpg" files into `paths`.
    /* imagesPath--|
                   |--class0--|
                   |          |--f0.jpg
                   |          |--f1.jpg
                   |--class1--|
                              |--f0.jpg
                              |--f1.jpg
       ... */
    void ANSFRHelper::GetFilePaths(std::string rootPath, std::vector<Paths>& paths) {
        DIR* dir;
        struct dirent* entry;
        std::string postfix = ".jpg";
        if ((dir = opendir(rootPath.c_str())) != NULL) {
            while ((entry = readdir(dir)) != NULL) {
                // Skip "." and ".." — the original descended into them.
                if (strcmp(entry->d_name, ".") == 0 || strcmp(entry->d_name, "..") == 0)
                    continue;
                std::string class_path = rootPath + "/" + entry->d_name;
                DIR* class_dir = opendir(class_path.c_str());
                if (class_dir == NULL)
                    continue; // original dereferenced a null DIR* here
                struct dirent* file_entry;
                while ((file_entry = readdir(class_dir)) != NULL) {
                    std::string name(file_entry->d_name);
                    if (name.length() >= postfix.length() &&
                        0 == name.compare(name.length() - postfix.length(), postfix.length(), postfix))
                        if (file_entry->d_type != DT_DIR) {
                            struct Paths tempPaths;
                            tempPaths.className = std::string(entry->d_name);
                            tempPaths.absPath = class_path + "/" + name;
                            paths.push_back(tempPaths);
                        }
                }
                closedir(class_dir); // original leaked this handle
            }
            closedir(dir);
        }
    }

    /// Serializes a cv::Mat's pixel buffer into a heap array.
    /// Caller owns the result and must delete[] it. `bufferLengh` receives the
    /// byte count.
    unsigned char* ANSCENTER::ANSFRHelper::CVMatToBytes(cv::Mat image, unsigned int& bufferLengh) {
        int size = int(image.total() * image.elemSize());
        unsigned char* bytes = new unsigned char[size]; // you will have to delete[] that later
        std::memcpy(bytes, image.data, size * sizeof(unsigned char));
        bufferLengh = size * sizeof(unsigned char);
        return bytes;
    }

    /// Current local time formatted as "YYYYmmddHHMMSS".
    /// NOTE(review): localtime_s is MSVC-specific — this file targets Windows.
    std::string ANSFRHelper::StringCurrentDateTime() {
        std::time_t t = std::time(nullptr);
        std::tm now = {}; // Initialize to all zeros
        localtime_s(&now, &t);
        std::stringstream ss;
        ss << std::put_time(&now, "%Y%m%d%H%M%S");
        return ss.str();
    }

    /// Serializes detected faces as {"results": [ {...}, ... ]} JSON.
    std::string ANSFRHelper::FaceObjectsToJsonString(const std::vector<FaceObject>& faces) {
        boost::property_tree::ptree root;
        boost::property_tree::ptree detectedObjects;
        for (size_t i = 0; i < faces.size(); i++) {
            boost::property_tree::ptree detectedNode;
            detectedNode.put("user_id", faces[i].userId);
            detectedNode.put("user_name", faces[i].userName);
            detectedNode.put("similarity", faces[i].similarity);
            detectedNode.put("is_unknown", faces[i].isUnknown);
            detectedNode.put("prob", faces[i].confidence);
            detectedNode.put("x", faces[i].box.x);
            detectedNode.put("y", faces[i].box.y);
            detectedNode.put("width", faces[i].box.width);
            detectedNode.put("height", faces[i].box.height);
            detectedNode.put("extra_info", faces[i].extraInformation); // we might add masks into this using comma seperated string
            detectedObjects.push_back(std::make_pair("", detectedNode));
        }
        root.add_child("results", detectedObjects);
        std::ostringstream stream;
        boost::property_tree::write_json(stream, root, false);
        return stream.str();
    }

    /// Serializes one face's enabled attributes as {"attributes": [ {...} ]}.
    /// Emotion labels are remapped for display: happy -> Happy, neutral ->
    /// Neutral, everything else recognized -> Attentive, unknown -> Neutral.
    std::string ANSFRHelper::FaceAttributeToJsonString(Face face) {
        boost::property_tree::ptree root;
        boost::property_tree::ptree detectedObjects;
        boost::property_tree::ptree detectedNode;
        if (face.isAntispoofingEnabled()) {
            detectedNode.put("Antispoofing", face.isReal() ? "Real" : "Fake");
        }
        if (face.isFaceLivenessEnabled()) {
            detectedNode.put("FaceLiveness", face.getFaceLiveness() == 1 ? "Real" : "Fake");
        }
        if (face.isAgeGenderEnabled()) {
            detectedNode.put("Gender", face.isMale() ? "Male" : "Female");
            int age = face.getAge();
            if (age < 12) detectedNode.put("Age", "Kids");
            else if (age < 20) detectedNode.put("Age", "Young Adults");
            else if (age < 60) detectedNode.put("Age", "Adults");
            else detectedNode.put("Age", "Elders");
        }
        if (face.isEmotionsEnabled()) {
            const auto& [emotionName, emotionConfidence] = face.getMainEmotion();
            // Case-insensitive remap replaces the original "Sad"/"sad" etc.
            // pairwise comparisons.
            std::string lower = emotionName;
            std::transform(lower.begin(), lower.end(), lower.begin(),
                           [](unsigned char c) { return static_cast<char>(std::tolower(c)); });
            std::string adjustedEmotionName;
            if (lower == "happy") adjustedEmotionName = "Happy";
            else if (lower == "neutral") adjustedEmotionName = "Neutral";
            else if (lower == "sad" || lower == "angry" || lower == "anger" ||
                     lower == "surprised" || lower == "disgusted" || lower == "fearful")
                adjustedEmotionName = "Attentive";
            else adjustedEmotionName = "Neutral";
            std::ostringstream emotionStr;
            emotionStr << adjustedEmotionName << " (" << static_cast<int>(emotionConfidence * 100) << "%)";
            detectedNode.put("Emotion", emotionStr.str());
        }
        if (face.isHeadPoseEnabled()) {
            const auto& headPose = face.getHeadPose();
            std::ostringstream headPoseStr;
            headPoseStr << "(" << static_cast<int>(headPose.angle_r) << ", "
                        << static_cast<int>(headPose.angle_p) << ", "
                        << static_cast<int>(headPose.angle_y) << ")";
            detectedNode.put("Pose(r,p,y)", headPoseStr.str());
        }
        // we might add masks into this using comma seperated string
        detectedObjects.push_back(std::make_pair("", detectedNode));
        root.add_child("attributes", detectedObjects);
        std::ostringstream stream;
        boost::property_tree::write_json(stream, root, false);
        return stream.str();
    }
std::string ANSFRHelper::UserRecordToJsonString(const UserRecord userRecord) { boost::property_tree::ptree root; boost::property_tree::ptree faceIds; for (int i = 0; i < userRecord.FaceIds.size(); i++) { boost::property_tree::ptree faceIdNode; faceIdNode.put("", userRecord.FaceIds[i]); faceIds.push_back(std::make_pair("", faceIdNode)); } root.put("user_id", userRecord.UserId); root.put("user_code", userRecord.UserCode); root.put("user_username", userRecord.UserName); root.add_child("face_ids", faceIds); std::ostringstream stream; boost::property_tree::write_json(stream, root,false); std::string userRecordResult = stream.str(); return userRecordResult; } std::string ANSFRHelper::UserRecordsToJsonString(const std::vector userRecords) { boost::property_tree::ptree root; boost::property_tree::ptree userRecordNodes; for (int i=0; i < userRecords.size(); i++) { boost::property_tree::ptree userRecordNode; boost::property_tree::ptree faceIds; UserRecord userRecord = userRecords[i]; for (int j = 0; j < userRecord.FaceIds.size(); j++) { boost::property_tree::ptree faceIdNode; faceIdNode.put("", userRecord.FaceIds[j]); faceIds.push_back(std::make_pair("", faceIdNode)); } userRecordNode.put("user_id", userRecord.UserId); userRecordNode.put("user_code", userRecord.UserCode); userRecordNode.put("user_username", userRecord.UserName); userRecordNode.add_child("face_ids", faceIds); userRecordNodes.push_back(std::make_pair("", userRecordNode)); } root.add_child("user_records", userRecordNodes); std::ostringstream stream; boost::property_tree::write_json(stream, root,false); std::string userRecordResult = stream.str(); return userRecordResult; } std::string ANSFRHelper::FaceRecordToJsonString(const FaceRecord faceRecord) { boost::property_tree::ptree root; root.put("face_id", faceRecord.FaceId); root.put("user_id", faceRecord.UserId); root.put("image_path", faceRecord.ImagePath); std::ostringstream stream; boost::property_tree::write_json(stream, root,false); std::string 
userRecordResult = stream.str(); return userRecordResult; } std::string ANSFRHelper::FaceRecordsToJsonString(const std::vector faceRecords) { boost::property_tree::ptree root; boost::property_tree::ptree faceNodes; for (int i = 0; i < faceRecords.size(); i++) { FaceRecord faceRecord = faceRecords[i]; boost::property_tree::ptree faceNode; faceNode.put("face_id", faceRecord.FaceId); faceNode.put("user_id", faceRecord.UserId); faceNode.put("image_path", faceRecord.ImagePath); faceNodes.push_back(std::make_pair("", faceNode)); } root.add_child("face_records", faceNodes); std::ostringstream stream; boost::property_tree::write_json(stream, root,false); std::string userRecordResult = stream.str(); return userRecordResult; } cv::Mat ANSFRHelper::PreprocessImg(cv::Mat& img, int input_w, int input_h) { try { int w, h, x, y; float r_w = input_w / (img.cols * 1.0); float r_h = input_h / (img.rows * 1.0); if (r_h > r_w) { w = input_w; h = r_w * img.rows; x = 0; y = (input_h - h) / 2; } else { w = r_h * img.cols; h = input_h; x = (input_w - w) / 2; y = 0; } cv::Mat re(h, w, CV_8UC3); cv::resize(img, re, re.size(), 0, 0, cv::INTER_LINEAR); cv::Mat out(input_h, input_w, CV_8UC3, cv::Scalar(128, 128, 128)); re.copyTo(out(cv::Rect(x, y, re.cols, re.rows))); return out; } catch (std::exception& e) { cv::Mat result; std::cerr << "ANSFRHelper::PreprocessImg" << e.what(); return result; } } int ANSFRHelper::ReadFilesInDir(const char* p_dir_name, std::vector& file_names) { try { DIR* p_dir = opendir(p_dir_name); if (p_dir == nullptr) { return -1; } struct dirent* p_file = nullptr; while ((p_file = readdir(p_dir)) != nullptr) { if (strcmp(p_file->d_name, ".") != 0 && strcmp(p_file->d_name, "..") != 0) { std::string cur_file_name(p_file->d_name); file_names.push_back(cur_file_name); } } closedir(p_dir); return 0; } catch (std::exception& e) { std::cerr << "ANSFRHelper::ReadFilesInDir" << e.what(); return -1; } } cv::Rect ANSFRHelper::GetRectAdaptLandmark(cv::Mat& img, int input_w, int 
input_h, float bbox[4], float lmk[10]) { int l, r, t, b; float r_w = input_w / (img.cols * 1.0); float r_h = input_h / (img.rows * 1.0); if (r_h > r_w) { l = bbox[0] / r_w; r = bbox[2] / r_w; t = (bbox[1] - (input_h - r_w * img.rows) / 2) / r_w; b = (bbox[3] - (input_h - r_w * img.rows) / 2) / r_w; for (int i = 0; i < 10; i += 2) { lmk[i] /= r_w; lmk[i + 1] = (lmk[i + 1] - (input_h - r_w * img.rows) / 2) / r_w; } } else { l = (bbox[0] - (input_w - r_h * img.cols) / 2) / r_h; r = (bbox[2] - (input_w - r_h * img.cols) / 2) / r_h; t = bbox[1] / r_h; b = bbox[3] / r_h; for (int i = 0; i < 10; i += 2) { lmk[i] = (lmk[i] - (input_w - r_h * img.cols) / 2) / r_h; lmk[i + 1] /= r_h; } } return cv::Rect(l, t, r - l, b - t); } float ANSFRHelper::IOU(float lbox[4], float rbox[4]) { float interBox[] = { MAX(lbox[0], rbox[0]), //left MIN(lbox[2], rbox[2]), //right MAX(lbox[1], rbox[1]), //top MIN(lbox[3], rbox[3]), //bottom }; if (interBox[2] > interBox[3] || interBox[0] > interBox[1]) return 0.0f; float interBoxS = (interBox[1] - interBox[0]) * (interBox[3] - interBox[2]); return interBoxS / ((lbox[2] - lbox[0]) * (lbox[3] - lbox[1]) + (rbox[2] - rbox[0]) * (rbox[3] - rbox[1]) - interBoxS + 0.000001f); } bool ANSFRHelper::CMP(const Detection& a, const Detection& b) { return a.class_confidence > b.class_confidence; } void ANSFRHelper::NMS(std::vector& res, float* output, float nms_thresh) { std::vector dets; for (int i = 0; i < output[0]; i++) { if (output[15 * i + 1 + 4] <= 0.1) continue; Detection det; memcpy(&det, &output[15 * i + 1], sizeof(Detection)); dets.push_back(det); } std::sort(dets.begin(), dets.end(), ANSFRHelper::CMP); for (size_t m = 0; m < dets.size(); ++m) { auto& item = dets[m]; res.push_back(item); //std::cout << item.class_confidence << " bbox " << item.bbox[0] << ", " << item.bbox[1] << ", " << item.bbox[2] << ", " << item.bbox[3] << std::endl; for (size_t n = m + 1; n < dets.size(); ++n) { if (ANSFRHelper::IOU(item.bbox, dets[n].bbox) > nms_thresh) { 
dets.erase(dets.begin() + n); --n; } } } } std::map ANSFRHelper::LoadWeights(const std::string file) { std::cout << "Loading weights: " << file << std::endl; std::map weightMap; // Open weights file std::ifstream input(file); assert(input.is_open() && "Unable to load weight file."); // Read number of weight blobs int32_t count; input >> count; assert(count > 0 && "Invalid weight map file."); while (count--) { Weights wt{ DataType::kFLOAT, nullptr, 0 }; uint32_t size; // Read name and type of blob std::string name; input >> name >> std::dec >> size; wt.type = DataType::kFLOAT; // Load blob uint32_t* val = reinterpret_cast(malloc(sizeof(val) * size)); for (uint32_t x = 0, y = size; x < y; ++x) { input >> std::hex >> val[x]; } wt.values = val; wt.count = size; weightMap[name] = wt; } return weightMap; } Weights ANSFRHelper::GetWeights(std::map& weightMap, std::string key) { if (weightMap.count(key) != 1) { std::cerr << key << " not existed in weight map, fatal error!!!" << std::endl; exit(-1); } return weightMap[key]; } IScaleLayer* ANSFRHelper::AddBatchNorm2D(INetworkDefinition* network, std::map& weightMap, ITensor& input, std::string lname, float eps) { float* gamma = (float*)weightMap[lname + ".weight"].values; float* beta = (float*)weightMap[lname + ".bias"].values; float* mean = (float*)weightMap[lname + ".running_mean"].values; float* var = (float*)weightMap[lname + ".running_var"].values; int len = weightMap[lname + ".running_var"].count; float* scval = reinterpret_cast(malloc(sizeof(float) * len)); for (int i = 0; i < len; i++) { scval[i] = gamma[i] / sqrt(var[i] + eps); } Weights scale{ DataType::kFLOAT, scval, len }; float* shval = reinterpret_cast(malloc(sizeof(float) * len)); for (int i = 0; i < len; i++) { shval[i] = beta[i] - mean[i] * gamma[i] / sqrt(var[i] + eps); } Weights shift{ DataType::kFLOAT, shval, len }; float* pval = reinterpret_cast(malloc(sizeof(float) * len)); for (int i = 0; i < len; i++) { pval[i] = 1.0; } Weights power{ 
DataType::kFLOAT, pval, len }; weightMap[lname + ".scale"] = scale; weightMap[lname + ".shift"] = shift; weightMap[lname + ".power"] = power; IScaleLayer* scale_1 = network->addScale(input, ScaleMode::kCHANNEL, shift, scale, power); assert(scale_1); return scale_1; } /// /// MatMul /// //MatMul::MatMul() { // try { // ANSFRHelper::ANSFRHelper::CheckCudaStatus(cudaMalloc(&workspace, workspaceSize)); // ANSFRHelper::CheckCublasStatus(cublasLtCreate(<Handle)); // ANSFRHelper::CheckCudaStatus(cudaStreamCreate(&stream)); // } // catch (std::exception& e) { // std::cerr << "MatMul::MatMul" << e.what(); // } //} //void MatMul::Init(float* knownEmbeds, int numRow, int numCol) { // try { // m = static_cast(numRow); // k = static_cast(numCol); // lda = static_cast(numCol); // ldb = static_cast(numCol); // ldc = static_cast(numRow); // // alloc and copy known embeddings to GPU // ANSFRHelper::CheckCudaStatus(cudaMalloc(reinterpret_cast(&dA), m * k * sizeof(float))); // ANSFRHelper::CheckCudaStatus(cudaMemcpyAsync(dA, knownEmbeds, m * k * sizeof(float), cudaMemcpyHostToDevice, stream)); // // create operation desciriptor; see cublasLtMatmulDescAttributes_t for details about defaults; // // here we just need to set the transforms for A and B // ANSFRHelper::CheckCublasStatus(cublasLtMatmulDescCreate(&operationDesc, computeType, cudaDataType)); // ANSFRHelper::CheckCublasStatus(cublasLtMatmulDescSetAttribute(operationDesc, CUBLASLT_MATMUL_DESC_TRANSA, &transa, sizeof(transa))); // ANSFRHelper::CheckCublasStatus(cublasLtMatmulDescSetAttribute(operationDesc, CUBLASLT_MATMUL_DESC_TRANSB, &transb, sizeof(transb))); // // create matrix descriptors, we are good with the details here so no need to set any extra attributes // ANSFRHelper::CheckCublasStatus(cublasLtMatrixLayoutCreate(&Adesc, cudaDataType, transa == CUBLAS_OP_N ? m : k, transa == CUBLAS_OP_N ? 
k : m, lda)); // // create preference handle; here we could use extra attributes to disable tensor ops or to make sure algo selected // // will work with badly aligned A, B, C; here for simplicity we just assume A,B,C are always well aligned (e.g. // // directly come from cudaMalloc) // ANSFRHelper::CheckCublasStatus(cublasLtMatmulPreferenceCreate(&preference)); // ANSFRHelper::CheckCublasStatus(cublasLtMatmulPreferenceSetAttribute(preference, CUBLASLT_MATMUL_PREF_MAX_WORKSPACE_BYTES, &workspaceSize, sizeof(workspaceSize))); // } // catch (std::exception& e) { // std::cerr << "MatMul::Init" << e.what(); // } //} //void MatMul::Calculate(float* embeds, int embedCount, float* outputs) { // try { // n = embedCount; // // Allocate arrays on GPU // ANSFRHelper::CheckCudaStatus(cudaMalloc(reinterpret_cast(&dB), k * n * sizeof(float))); // ANSFRHelper::CheckCudaStatus(cudaMalloc(reinterpret_cast(&dC), m * n * sizeof(float))); // ANSFRHelper::CheckCudaStatus(cudaMemcpyAsync(dB, embeds, k * n * sizeof(float), cudaMemcpyHostToDevice, stream)); // // create matrix descriptors, we are good with the details here so no need to set any extra attributes // cublasLtMatrixLayout_t Bdesc = NULL, Cdesc = NULL; // ANSFRHelper::CheckCublasStatus(cublasLtMatrixLayoutCreate(&Bdesc, cudaDataType, transb == CUBLAS_OP_N ? k : n, transb == CUBLAS_OP_N ? n : k, ldb)); // ANSFRHelper::CheckCublasStatus(cublasLtMatrixLayoutCreate(&Cdesc, cudaDataType, m, n, ldc)); // // we just need the best available heuristic to try and run matmul. There is no guarantee this will work, e.g. if A // // is badly aligned, you can request more (e.g. 
32) algos and try to run them one by one until something works // int returnedResults = 0; // cublasLtMatmulHeuristicResult_t heuristicResult = {}; // ANSFRHelper::CheckCublasStatus(cublasLtMatmulAlgoGetHeuristic(ltHandle, operationDesc, Adesc, Bdesc, Cdesc, Cdesc, preference, 1, &heuristicResult, &returnedResults)); // if (returnedResults == 0) { // ANSFRHelper::CheckCublasStatus(CUBLAS_STATUS_NOT_SUPPORTED); // } // // Do the actual multiplication // ANSFRHelper::CheckCublasStatus(cublasLtMatmul(ltHandle, operationDesc, &alpha, dA, Adesc, dB, Bdesc, &beta, dC, Cdesc, dC, Cdesc, &heuristicResult.algo, workspace, // workspaceSize, stream)); // // Cleanup: descriptors are no longer needed as all GPU work was already enqueued // if (Cdesc) // ANSFRHelper::CheckCublasStatus(cublasLtMatrixLayoutDestroy(Cdesc)); // if (Bdesc) // ANSFRHelper::CheckCublasStatus(cublasLtMatrixLayoutDestroy(Bdesc)); // // Copy the result on host memory // ANSFRHelper::CheckCudaStatus(cudaMemcpyAsync(outputs, dC, m * n * sizeof(float), cudaMemcpyDeviceToHost, stream)); // // CUDA stream sync // ANSFRHelper::CheckCudaStatus(cudaStreamSynchronize(stream)); // // Free GPU memory // ANSFRHelper::CheckCudaStatus(cudaFree(dB)); // ANSFRHelper::CheckCudaStatus(cudaFree(dC)); // } // catch (std::exception& e) { // std::cerr <<"MatMul::Calculate"<< e.what(); // } //} //MatMul::~MatMul() { // try { // if (preference) // ANSFRHelper::CheckCublasStatus(cublasLtMatmulPreferenceDestroy(preference)); // if (Adesc) // ANSFRHelper::CheckCublasStatus(cublasLtMatrixLayoutDestroy(Adesc)); // if (operationDesc) // ANSFRHelper::CheckCublasStatus(cublasLtMatmulDescDestroy(operationDesc)); // ANSFRHelper::CheckCublasStatus(cublasLtDestroy(ltHandle)); // ANSFRHelper::CheckCudaStatus(cudaFree(dA)); // ANSFRHelper::CheckCudaStatus(cudaFree(workspace)); // ANSFRHelper::CheckCudaStatus(cudaStreamDestroy(stream)); // } // catch (std::exception& e) { // std::cout << "MatMul::~MatMul" << e.what(); // } //} 
//Int8EntropyCalibrator2::Int8EntropyCalibrator2(int batchsize, int input_w, int input_h, const char* img_dir, const char* calib_table_name, const char* input_blob_name, bool read_cache) // : batchsize_(batchsize) // , input_w_(input_w) // , input_h_(input_h) // , img_idx_(0) // , img_dir_(img_dir) // , calib_table_name_(calib_table_name) // , input_blob_name_(input_blob_name) // , read_cache_(read_cache) //{ // input_count_ = 3 * input_w * input_h * batchsize; // CUDACHECK(cudaMalloc(&device_input_, input_count_ * sizeof(float))); // ANSFRHelper::ReadFilesInDir(img_dir, img_files_); //} //Int8EntropyCalibrator2::~Int8EntropyCalibrator2() //{ // CUDACHECK(cudaFree(device_input_)); //} //int Int8EntropyCalibrator2::getBatchSize() const TRT_NOEXCEPT //{ // return batchsize_; //} //bool Int8EntropyCalibrator2::getBatch(void* bindings[], const char* names[], int nbBindings) TRT_NOEXCEPT //{ // if (img_idx_ + batchsize_ > (int)img_files_.size()) { // return false; // } // std::vector input_imgs_; // for (int i = img_idx_; i < img_idx_ + batchsize_; i++) { // std::cout << img_files_[i] << " " << i << std::endl; // cv::Mat temp = cv::imread(img_dir_ + img_files_[i]); // if (temp.empty()) { // std::cerr << "Fatal error: image cannot open!" 
<< std::endl; // return false; // } // cv::Mat pr_img = ANSFRHelper::PreprocessImg(temp, input_w_, input_h_); // input_imgs_.push_back(pr_img); // } // img_idx_ += batchsize_; // cv::Mat blob = cv::dnn::blobFromImages(input_imgs_, 1.0, cv::Size(input_w_, input_h_), cv::Scalar(104, 117, 123), false, false); // CUDACHECK(cudaMemcpy(device_input_, blob.ptr(0), input_count_ * sizeof(float), cudaMemcpyHostToDevice)); // assert(!strcmp(names[0], input_blob_name_)); // bindings[0] = device_input_; // return true; //} //const void* Int8EntropyCalibrator2::readCalibrationCache(size_t& length) TRT_NOEXCEPT //{ // std::cout << "reading calib cache: " << calib_table_name_ << std::endl; // calib_cache_.clear(); // std::ifstream input(calib_table_name_, std::ios::binary); // input >> std::noskipws; // if (read_cache_ && input.good()) // { // std::copy(std::istream_iterator(input), std::istream_iterator(), std::back_inserter(calib_cache_)); // } // length = calib_cache_.size(); // return length ? calib_cache_.data() : nullptr; //} //void Int8EntropyCalibrator2::writeCalibrationCache(const void* cache, size_t length) TRT_NOEXCEPT //{ // std::cout << "writing calib cache: " << calib_table_name_ << " size: " << length << std::endl; // std::ofstream output(calib_table_name_, std::ios::binary); // output.write(reinterpret_cast(cache), length); //} }