From: Vincent Vanwaelscappel Date: Mon, 4 Aug 2025 13:45:05 +0000 (+0200) Subject: #7678 X-Git-Url: http://git.cubedesigners.com/?a=commitdiff_plain;h=aa9ae1a7410485364d5c5b8b0896233c1845afed;p=cubist_pdf.git #7678 --- diff --git a/resources/tools/docling/convert_page.py b/resources/tools/docling/convert_page.py index d91230a..86d4f7a 100644 --- a/resources/tools/docling/convert_page.py +++ b/resources/tools/docling/convert_page.py @@ -21,13 +21,5 @@ converter = DocumentConverter( } ) result = converter.convert(sys.argv[1]) -allpages=result.document.export_to_markdown(page_break_placeholder="", image_mode=ImageRefMode.EMBEDDED); -Path(sys.argv[2]+"document.md").write_text(allpages) -i=0 -for md in allpages.split(""): - i+=1 - while os.stat(Path(sys.argv[2] + "/../texts/fh"+str(i)+".html")).st_size < 21: - Path(sys.argv[2]+"p"+str(i)+".md").write_text("") - i+=1 - Path(sys.argv[2]+"p"+str(i)+".md").write_text(md) +Path(sys.argv[2]).write_text(result.document.export_to_markdown(image_mode=ImageRefMode.EMBEDDED))