Continue to use the PaddleOCR v3 text detection model for the large model size

In testing, the v5 detection model was not finding text on multi-line plates at all.
This commit is contained in:
Josh Hawkins 2025-09-17 14:43:08 -05:00
parent 26178444f3
commit e6ccd40dbb

View File

@@ -32,7 +32,7 @@ class PaddleOCRDetection(BaseEmbedding):
device: str = "AUTO",
):
model_file = (
- "detection_v5-large.onnx"
+ "detection_v3-large.onnx"
if model_size == "large"
else "detection_v5-small.onnx"
)
@@ -40,7 +40,7 @@ class PaddleOCRDetection(BaseEmbedding):
model_name="paddleocr-onnx",
model_file=model_file,
download_urls={
- model_file: f"https://github.com/hawkeye217/paddleocr-onnx/raw/refs/heads/master/models/v5/{model_file}"
+ model_file: f"https://github.com/hawkeye217/paddleocr-onnx/raw/refs/heads/master/models/{'v3' if model_size == 'large' else 'v5'}/{model_file}"
},
)
self.requestor = requestor