report-detect/scripts/test_ocr_single.py

38 lines
1.2 KiB
Python
Raw Normal View History

2026-02-05 13:57:22 +08:00
#!/usr/bin/env python
# -*- coding: utf-8 -*-
"""
Test OCR on a single image and dump the raw recognition output to a text file.
"""
import sys
import os
def test_ocr(image_path, output_path="ocr_debug.txt",
             model_name="PP-OCRv4_server_rec"):
    """Run PaddleOCR text recognition on one image and dump the raw result.

    The prediction output is written to a UTF-8 text file so that its
    structure (types, attributes, repr) can be inspected by hand.

    Args:
        image_path: Image handed to ``TextRecognition.predict``.
        output_path: Text file receiving the dump; opened in ``"w"`` mode,
            so an existing file is overwritten.
        model_name: Model name passed to the ``TextRecognition`` constructor.

    Returns:
        True when the dump was written, False when any step failed.
        Failures are reported on stderr instead of being raised.
    """
    print(f"Loading {image_path}...", file=sys.stderr)
    try:
        # Kept ahead of the paddleocr import, as in the original ordering;
        # presumably the library consults this flag while loading -- TODO confirm.
        os.environ["DISABLE_MODEL_SOURCE_CHECK"] = "True"
        # Imported here so a missing or broken paddleocr install is reported
        # through the same error path as a failed prediction.
        from paddleocr import TextRecognition

        text_rec = TextRecognition(model_name=model_name)
        output = text_rec.predict(image_path, batch_size=1)

        with open(output_path, "w", encoding="utf-8") as f:
            f.write("Raw Output:\n")
            if isinstance(output, list):
                f.write(f"Output is list of length {len(output)}\n")
                for i, res in enumerate(output):
                    f.write(f"Item {i} type: {type(res)}\n")
                    f.write(f"Item {i} dir: {dir(res)}\n")
                    f.write(f"Item {i} repr: {res}\n")
            else:
                f.write(f"Output type: {type(output)}\n")
                f.write(str(output) + "\n")
    except Exception as e:
        # Top-level boundary of a debugging script: report and signal failure
        # through the return value rather than crashing with a traceback.
        print(f"Error: {e}", file=sys.stderr)
        return False
    return True


# The name matches pytest's default ``test_*`` pattern, but this is a manual
# debugging helper that needs a real image path; opt out of test collection so
# a repository-wide pytest run does not fail on a missing ``image_path`` fixture.
test_ocr.__test__ = False
# Script entry point: expects the image path as the first command-line argument.
if __name__ == "__main__":
    if len(sys.argv) < 2:
        # Usage errors are diagnostics, so they go to stderr like the other
        # messages this script prints.
        print("Usage: python test_ocr_single.py <image_path>", file=sys.stderr)
        sys.exit(1)
    # Only an explicit False is treated as failure; any other return value
    # (including None) keeps the exit status at 0.
    sys.exit(1 if test_ocr(sys.argv[1]) is False else 0)