diff --git a/backend/app/services/ocr_to_unified_converter.py b/backend/app/services/ocr_to_unified_converter.py index b94874d..721eed4 100644 --- a/backend/app/services/ocr_to_unified_converter.py +++ b/backend/app/services/ocr_to_unified_converter.py @@ -543,6 +543,13 @@ class OCRToUnifiedConverter: html = elem_data.get('html', '') extracted_text = elem_data.get('extracted_text', '') + # Fallback: check content field for HTML table if html field is empty + if not html: + content = elem_data.get('content', '') + if isinstance(content, str) and '