From 65519b08ca1301d783097a6d70186ebd4be9561a Mon Sep 17 00:00:00 2001
From: Michele Dolfi
Date: Fri, 31 Jan 2025 17:03:56 +0100
Subject: [PATCH] markdown placeholder

Signed-off-by: Michele Dolfi
---
 docling_core/types/doc/document.py | 17 ++++++++++++-----
 1 file changed, 12 insertions(+), 5 deletions(-)

diff --git a/docling_core/types/doc/document.py b/docling_core/types/doc/document.py
index cfa82c4..b0e1007 100644
--- a/docling_core/types/doc/document.py
+++ b/docling_core/types/doc/document.py
@@ -2227,11 +2227,18 @@ def _append_text(text: str, do_escape_html=True, do_escape_underscores=True):
 
             elif isinstance(item, TextItem) and item.label in [DocItemLabel.FORMULA]:
                 in_list = False
-                _append_text(
-                    f"$${item.text}$$\n",
-                    do_escape_underscores=False,
-                    do_escape_html=False,
-                )
+                if item.text != "":
+                    _append_text(
+                        f"$${item.text}$$\n",
+                        do_escape_underscores=False,
+                        do_escape_html=False,
+                    )
+                elif item.orig != "":
+                    _append_text(
+                        "\n",
+                        do_escape_underscores=False,
+                        do_escape_html=False,
+                    )
 
             elif isinstance(item, TextItem) and item.label in labels:
                 in_list = False