feat: upgrade PP-StructureV3 models to latest versions

- Layout: PP-DocLayout-S → PP-DocLayout_plus-L (83.2% mAP)
- Table: Single model → Dual SLANeXt (wired/wireless)
- Formula: PP-FormulaNet_plus-L for enhanced recognition
- Add preprocessing flags support (orientation, unwarping)
- Update frontend i18n descriptions

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
2025-11-27 14:21:24 +08:00
parent 59206a6ab8
commit 6235280c45
9 changed files with 504 additions and 25 deletions
--- a/backend/app/schemas/task.py
+++ b/backend/app/schemas/task.py
@@ -28,11 +28,11 @@ class LayoutModelEnum(str, Enum):
    """Layout detection model selection for OCR track.

    Different models are optimized for different document types:
-    - CHINESE: PP-DocLayout-S, optimized for Chinese documents (forms, contracts, invoices)
-    - DEFAULT: PubLayNet-based, optimized for English academic papers
-    - CDLA: CDLA model, specialized Chinese document layout analysis
+    - CHINESE: PP-DocLayout_plus-L (83.2% mAP), optimized for complex Chinese documents
+    - DEFAULT: PubLayNet-based (~94% mAP), optimized for English academic papers
+    - CDLA: CDLA model (~86% mAP), specialized Chinese document layout analysis
    """
-    CHINESE = "chinese"   # PP-DocLayout-S - Best for Chinese documents (recommended)
+    CHINESE = "chinese"   # PP-DocLayout_plus-L - Best for Chinese documents (recommended)
    DEFAULT = "default"   # PubLayNet-based - Best for English documents
    CDLA = "cdla"         # CDLA model - Alternative for Chinese layout