Gracefully handle missing PaddleOCRVL

2026-03-19 15:02:01 +08:00 · 2026-03-19 15:02:01 +08:00 · 9ef41799c9
parent b5baaa38c3
commit 9ef41799c9
2 changed files with 74 additions and 54 deletions
--- a/python_api/ocr_api_server.py
+++ b/python_api/ocr_api_server.py
@ -16,7 +16,11 @@ import logging
 import traceback
 from pathlib import Path
 from flask import Flask, request, jsonify
-from paddleocr import PaddleOCR, PaddleOCRVL
+from paddleocr import PaddleOCR
 try:
    from paddleocr import PaddleOCRVL  # type: ignore
 except Exception:
    PaddleOCRVL = None
 # 配置日志
 logging.basicConfig(
@ -93,26 +97,30 @@ def init_models():
    logger.info("=" * 60)
    logger.info("正在初始化 PaddleOCRVL...")
    logger.info("=" * 60)
-    try:
+    if PaddleOCRVL is None:
-        vl_kwargs = {
+        logger.warning("PaddleOCRVL not available in installed paddleocr. Skipping VL pipeline.")
            "use_seal_recognition": True,
            "use_ocr_for_image_block": True,
            "use_layout_detection": True,
            "use_doc_orientation_classify": False,
            "use_doc_unwarping": False,
        }
        if layout_dir:
            vl_kwargs["layout_detection_model_dir"] = str(layout_dir)
            vl_kwargs["layout_detection_model_name"] = "PP-DocLayoutV3"
        if vl_rec_dir:
            vl_kwargs["vl_rec_model_dir"] = str(vl_rec_dir)
            vl_kwargs["vl_rec_model_name"] = "PaddleOCR-VL-1.5-0.9B"
        vl_pipeline = PaddleOCRVL(**vl_kwargs)
        logger.info("✅ PaddleOCRVL 初始化成功")
    except Exception as e:
        logger.error(f"❌ PaddleOCRVL 初始化失败: {e}", exc_info=True)
        vl_pipeline = None
    else:
        try:
            vl_kwargs = {
                "use_seal_recognition": True,
                "use_ocr_for_image_block": True,
                "use_layout_detection": True,
                "use_doc_orientation_classify": False,
                "use_doc_unwarping": False,
            }
            if layout_dir:
                vl_kwargs["layout_detection_model_dir"] = str(layout_dir)
                vl_kwargs["layout_detection_model_name"] = "PP-DocLayoutV3"
            if vl_rec_dir:
                vl_kwargs["vl_rec_model_dir"] = str(vl_rec_dir)
                vl_kwargs["vl_rec_model_name"] = "PaddleOCR-VL-1.5-0.9B"
            vl_pipeline = PaddleOCRVL(**vl_kwargs)
            logger.info("✅ PaddleOCRVL 初始化成功")
        except Exception as e:
            logger.error(f"❌ PaddleOCRVL 初始化失败: {e}", exc_info=True)
            vl_pipeline = None
    # 初始化 PP-OCRv5
    logger.info("=" * 60)
@ -220,10 +228,11 @@ def ocr_pdf():
        # 处理 PDF（传递 verbose 参数）
        try:
            ocr_model = 'paddleocr_vl' if vl_pipeline else 'ppocr_v5'
            result = process_single_pdf_standalone(
                Path(pdf_path),
                Path(output_dir),
-                ocr_model='paddleocr_vl',
+                ocr_model=ocr_model,
                vl_pipeline=vl_pipeline,
                verbose=verbose  # 新增：传递verbose参数
            )
@ -298,12 +307,13 @@ def ocr_image():
            return jsonify({'success': False, 'error': f'Image not found: {image_path}'}), 404
        logger.info(f"处理图像: {image_path}")
-
+        # Use PaddleOCRVL if available, otherwise fallback to PaddleOCR
-        # 使用 PaddleOCRVL 识别
+        if vl_pipeline:
-        if not vl_pipeline:
+            result = vl_pipeline.ocr(image_path)
-            return jsonify({'success': False, 'error': 'PaddleOCRVL not initialized'}), 500
+        else:
-
+            if not ocr_pipeline:
-        result = vl_pipeline.ocr(image_path)
+                return jsonify({'success': False, 'error': 'OCR pipeline not initialized'}), 500
            result = ocr_pipeline.ocr(image_path)
        # 提取文本
        texts = []
--- a/src/main/resources/python-api/ocr_api_server.py
+++ b/src/main/resources/python-api/ocr_api_server.py
@ -15,7 +15,11 @@ import json
 import logging
 from pathlib import Path
 from flask import Flask, request, jsonify
-from paddleocr import PaddleOCR, PaddleOCRVL
+from paddleocr import PaddleOCR
 try:
    from paddleocr import PaddleOCRVL  # type: ignore
 except Exception:
    PaddleOCRVL = None
 # 配置日志
 logging.basicConfig(
@ -92,26 +96,30 @@ def init_models():
    logger.info("=" * 60)
    logger.info("正在初始化 PaddleOCRVL...")
    logger.info("=" * 60)
-    try:
+    if PaddleOCRVL is None:
-        vl_kwargs = {
+        logger.warning("PaddleOCRVL not available in installed paddleocr. Skipping VL pipeline.")
            "use_seal_recognition": True,
            "use_ocr_for_image_block": True,
            "use_layout_detection": True,
            "use_doc_orientation_classify": False,
            "use_doc_unwarping": False,
        }
        if layout_dir:
            vl_kwargs["layout_detection_model_dir"] = str(layout_dir)
            vl_kwargs["layout_detection_model_name"] = "PP-DocLayoutV3"
        if vl_rec_dir:
            vl_kwargs["vl_rec_model_dir"] = str(vl_rec_dir)
            vl_kwargs["vl_rec_model_name"] = "PaddleOCR-VL-1.5-0.9B"
        vl_pipeline = PaddleOCRVL(**vl_kwargs)
        logger.info("✅ PaddleOCRVL 初始化成功")
    except Exception as e:
        logger.error(f"❌ PaddleOCRVL 初始化失败: {e}", exc_info=True)
        vl_pipeline = None
    else:
        try:
            vl_kwargs = {
                "use_seal_recognition": True,
                "use_ocr_for_image_block": True,
                "use_layout_detection": True,
                "use_doc_orientation_classify": False,
                "use_doc_unwarping": False,
            }
            if layout_dir:
                vl_kwargs["layout_detection_model_dir"] = str(layout_dir)
                vl_kwargs["layout_detection_model_name"] = "PP-DocLayoutV3"
            if vl_rec_dir:
                vl_kwargs["vl_rec_model_dir"] = str(vl_rec_dir)
                vl_kwargs["vl_rec_model_name"] = "PaddleOCR-VL-1.5-0.9B"
            vl_pipeline = PaddleOCRVL(**vl_kwargs)
            logger.info("✅ PaddleOCRVL 初始化成功")
        except Exception as e:
            logger.error(f"❌ PaddleOCRVL 初始化失败: {e}", exc_info=True)
            vl_pipeline = None
    # 初始化 PP-OCRv5
    logger.info("=" * 60)
@ -219,10 +227,11 @@ def ocr_pdf():
        # 处理 PDF（传递 verbose 参数）
        try:
            ocr_model = 'paddleocr_vl' if vl_pipeline else 'ppocr_v5'
            result = process_single_pdf_standalone(
                Path(pdf_path),
                Path(output_dir),
-                ocr_model='paddleocr_vl',
+                ocr_model=ocr_model,
                vl_pipeline=vl_pipeline,
                verbose=verbose  # 新增：传递verbose参数
            )
@ -280,12 +289,13 @@ def ocr_image():
            return jsonify({'success': False, 'error': f'Image not found: {image_path}'}), 404
        logger.info(f"处理图像: {image_path}")
-
+        # Use PaddleOCRVL if available, otherwise fallback to PaddleOCR
-        # 使用 PaddleOCRVL 识别
+        if vl_pipeline:
-        if not vl_pipeline:
+            result = vl_pipeline.ocr(image_path)
-            return jsonify({'success': False, 'error': 'PaddleOCRVL not initialized'}), 500
+        else:
-
+            if not ocr_pipeline:
-        result = vl_pipeline.ocr(image_path)
+                return jsonify({'success': False, 'error': 'OCR pipeline not initialized'}), 500
            result = ocr_pipeline.ocr(image_path)
        # 提取文本
        texts = []