Files
ANSCORE/modules/ANSOCR/ANSONNXOCR/PaddleOCRV5Engine.h

101 lines
3.6 KiB
C
Raw Normal View History

2026-03-28 16:54:11 +11:00
#pragma once
#include "ONNXOCRTypes.h"
#include "ONNXOCRDetector.h"
#include "ONNXOCRClassifier.h"
#include "ONNXOCRRecognizer.h"
#include <memory>
#include <mutex>
2026-04-13 20:38:40 +10:00
#include <atomic>
#include <chrono>
#include <thread>
2026-03-28 16:54:11 +11:00
#include <string>
#include <vector>
namespace ANSCENTER {
namespace onnxocr {
// PaddleOCR V5 pipeline engine: Detection -> (Classification) -> Recognition
// Mirrors the PaddleOCR::PPOCR interface for drop-in replacement
class PaddleOCRV5Engine {
public:
PaddleOCRV5Engine() = default;
~PaddleOCRV5Engine() = default;
// Initialize the OCR pipeline
// clsModelPath can be empty to skip classification
bool Initialize(const std::string& detModelPath,
const std::string& clsModelPath,
const std::string& recModelPath,
const std::string& dictPath);
// Run full OCR pipeline on an image
// Returns results matching PaddleOCR::OCRPredictResult format
std::vector<OCRPredictResult> ocr(const cv::Mat& img);
// Run recognizer only on a pre-cropped text image (no detection step)
TextLine recognizeOnly(const cv::Mat& croppedImage);
2026-03-28 16:54:11 +11:00
// Configuration setters (matching OCRModelConfig parameters)
void SetDetMaxSideLen(int val) { _maxSideLen = val; }
void SetDetDbThresh(float val) { _detDbThresh = val; }
void SetDetBoxThresh(float val) { _detBoxThresh = val; }
void SetDetUnclipRatio(float val) { _detUnclipRatio = val; }
void SetClsThresh(float val) { _clsThresh = val; }
void SetUseDilation(bool val) { _useDilation = val; }
private:
std::unique_ptr<ONNXOCRDetector> detector_;
std::unique_ptr<ONNXOCRClassifier> classifier_; // nullptr if not used
std::unique_ptr<ONNXOCRRecognizer> recognizer_;
std::recursive_mutex _mutex;
2026-04-13 20:38:40 +10:00
std::atomic<bool> _modelLoading{ false };
// RAII helper: sets _modelLoading=true on construction, false on destruction.
struct ModelLoadingGuard {
std::atomic<bool>& flag;
explicit ModelLoadingGuard(std::atomic<bool>& f) : flag(f) { flag.store(true); }
~ModelLoadingGuard() { flag.store(false); }
ModelLoadingGuard(const ModelLoadingGuard&) = delete;
ModelLoadingGuard& operator=(const ModelLoadingGuard&) = delete;
};
// Try to lock _mutex with a timeout. Returns a unique_lock that
// evaluates to true on success.
std::unique_lock<std::recursive_mutex> TryLockWithTimeout(
const char* caller, unsigned int timeoutMs = 5000)
{
const auto deadline = std::chrono::steady_clock::now()
+ std::chrono::milliseconds(timeoutMs);
std::unique_lock<std::recursive_mutex> lk(_mutex, std::defer_lock);
while (!lk.try_lock()) {
if (std::chrono::steady_clock::now() >= deadline) {
std::cerr << "[" << caller << "] Mutex acquisition timed out after "
<< timeoutMs << " ms"
<< (_modelLoading.load() ? " (model loading in progress)" : "")
<< std::endl;
return lk; // unlocked
}
std::this_thread::sleep_for(std::chrono::milliseconds(1));
}
return lk; // locked
}
2026-03-28 16:54:11 +11:00
// Detection parameters
int _maxSideLen = kDetMaxSideLen;
float _detDbThresh = kDetDbThresh;
float _detBoxThresh = kDetBoxThresh;
float _detUnclipRatio = kDetUnclipRatio;
bool _useDilation = false;
// Classifier parameters
float _clsThresh = kClsThresh;
bool _initialized = false;
};
} // namespace onnxocr
} // namespace ANSCENTER