From 1bc77ddb2258bcf9e94088a12b61c98a4239723e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=B0=91=E5=8D=BF?= Date: Tue, 9 Dec 2025 19:30:27 +0800 Subject: [PATCH] Fix: enhance type check robustness with mixed String/Enum types --- deepdoc/parser/mineru_parser.py | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/deepdoc/parser/mineru_parser.py b/deepdoc/parser/mineru_parser.py index a3ff16866..4161c2310 100644 --- a/deepdoc/parser/mineru_parser.py +++ b/deepdoc/parser/mineru_parser.py @@ -849,7 +849,11 @@ class MinerUParser(RAGFlowPdfParser): return img_root = subdir / "generated_images" img_root.mkdir(parents=True, exist_ok=True) - text_types = {"text", "list", "code", "header"} + text_types = { + "text", "list", "code", "header", "equation", + MinerUContentType.TEXT, MinerUContentType.LIST, MinerUContentType.CODE, + MinerUContentType.HEADER, MinerUContentType.EQUATION + } generated = 0 for idx, item in enumerate(outputs): if item.get("type") not in text_types: